{"eval":{"version":"openagentskill-skill-eval-v1","slug":"baidubce-app-builder","name":"App Builder","generated_at":"2026-07-03T21:44:16.358Z","task_input":"Evaluate App Builder before installing it in an AI agent workflow","status":"review","score":79,"risk_level":"medium","decision":{"recommendation":"manual_review","reason":"Review the audit page, then allow agent install in a sandboxed workflow.","auto_install_allowed":false,"policy":"review","human_review_required":true},"task_fit":{"score":84,"suited_tasks":["Coding agents workflows","Claude Code teams","teams that value GitHub adoption signals","Inspect source files","Explain architecture","Patch bugs and verify changes","Chunk documents","Create embeddings"],"suited_agents":["Python","RAG","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"]},"install":{"command":"npx skills add baidubce/app-builder","ready":true,"policy":"review","safety_label":"Review before install","targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add baidubce/app-builder"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"App Builder\" agent skill from https://github.com/baidubce/app-builder. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: appbuilder-sdk, 千帆AppBuilder-SDK帮助开发者灵活、快速的搭建AI原生应用"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"App Builder\" as a Claude Code skill from https://github.com/baidubce/app-builder. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: appbuilder-sdk, 千帆AppBuilder-SDK帮助开发者灵活、快速的搭建AI原生应用"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"App Builder\" from https://github.com/baidubce/app-builder into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: appbuilder-sdk, 千帆AppBuilder-SDK帮助开发者灵活、快速的搭建AI原生应用"}]},"trust":{"score":80,"label":"Strong shortlist","version":"trust-score-v4","evidence":{"stars":"583 GitHub stars","repoActivity":"583 stars, 143 forks","lastPushed":"2mo since push","license":"Apache-2.0","repository":"https://github.com/baidubce/app-builder","install":"npx skills add baidubce/app-builder","installSafety":"standard package or runtime install path","permissionSurface":"network or browser access","documentation":"Usable metadata, review docs","agentOutcomes":"No agent outcome data yet"}},"audit":{"score":83,"risk_level":"safe_to_try","risk_label":"Safe to try","warnings":["Quality score needs review","Documentation summary is thin"]},"safety_gate":{"score":71,"tier":"reviewed","label":"Reviewed","auto_install_policy":"review","blocked":false,"permission_hints":[{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"}],"policy_warnings":["Quality score needs review"]},"checks":[{"id":"task_fit","label":"Task fit","status":"pass","score":84,"required_for_auto_install":true,"detail":"Task wording matches this skill metadata.","evidence":["Evaluate App Builder before installing it in an AI agent workflow","data","Coding agents workflows; Claude Code teams; teams that value GitHub adoption signals"]},{"id":"install_path","label":"Install path","status":"pass","score":92,"required_for_auto_install":true,"detail":"Install handoff is available.","evidence":["npx skills add baidubce/app-builder"]},{"id":"install_safety","label":"Install command safety","status":"pass","score":92,"required_for_auto_install":true,"detail":"standard package or runtime install path","evidence":["npx skills add baidubce/app-builder"]},{"id":"trust_score","label":"Trust score","status":"warn","score":80,"required_for_auto_install":true,"detail":"Good trust signals with a few areas worth checking before rollout.","evidence":["Strong shortlist","583 GitHub stars","Apache-2.0"]},{"id":"audit_score","label":"Audit score","status":"pass","score":83,"required_for_auto_install":true,"detail":"Safe to try","evidence":["Quality score needs review"]},{"id":"agent_safety_gate","label":"Agent safety gate","status":"warn","score":71,"required_for_auto_install":true,"detail":"Good audit and safety signals with no high-risk permission hints in public metadata.","evidence":["Review the audit page, then allow agent install in a sandboxed workflow.","Safe-to-try audit"]},{"id":"readme_skillmd_completeness","label":"README/SKILL.md completeness","status":"warn","score":74,"required_for_auto_install":false,"detail":"Public metadata needs stronger README/SKILL.md context","evidence":["Usable metadata, review docs"]},{"id":"license_clarity","label":"License clarity","status":"pass","score":86,"required_for_auto_install":true,"detail":"Apache-2.0","evidence":["Apache-2.0"]},{"id":"recent_maintenance","label":"Recent maintenance","status":"pass","score":88,"required_for_auto_install":false,"detail":"2mo since push","evidence":["2mo since push"]},{"id":"permission_surface","label":"Permission surface","status":"pass","score":86,"required_for_auto_install":true,"detail":"network or browser access","evidence":["Network access: medium"]},{"id":"alternatives","label":"Alternatives available","status":"pass","score":82,"required_for_auto_install":false,"detail":"Alternative skills are available for comparison.","evidence":["shubhamsaboo-awesome-llm-apps","datawhalechina-hello-agents","pathwaycom-llm-app","flowiseai-flowise"]}],"blockers":[],"warnings":["Trust score: Good trust signals with a few areas worth checking before rollout.","Agent safety gate: Good audit and safety signals with no high-risk permission hints in public metadata.","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context","Quality score needs review","Documentation summary is thin"],"validation_plan":["Inspect repository, README/SKILL.md, license, and recent commits before production use.","Install in an isolated workspace or sandbox with no production secrets available.","Run the smallest representative task and record files touched, commands run, network access, and outputs.","Compare the selected skill against at least one alternative when the eval status is review or failed.","Promote only after the agent reports a successful verification result and unresolved warnings are accepted."],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","Quality score needs review","Documentation summary is thin","Production credentials, payments, or irreversible account changes without explicit human review","Sensitive private data before reviewing repository code, license, and permission surface","Automatic installation in a production workspace"],"alternatives":[{"slug":"shubhamsaboo-awesome-llm-apps","name":"Awesome Llm Apps","url":"https://www.openagentskill.com/skills/shubhamsaboo-awesome-llm-apps","stars":114473,"install_command":"npx skills add Shubhamsaboo/awesome-llm-apps","trust_score":93,"audit_score":95},{"slug":"datawhalechina-hello-agents","name":"Hello Agents","url":"https://www.openagentskill.com/skills/datawhalechina-hello-agents","stars":59476,"install_command":"npx skills add datawhalechina/hello-agents","trust_score":86,"audit_score":92},{"slug":"pathwaycom-llm-app","name":"Llm App","url":"https://www.openagentskill.com/skills/pathwaycom-llm-app","stars":59299,"install_command":"npx skills add pathwaycom/llm-app","trust_score":93,"audit_score":95},{"slug":"flowiseai-flowise","name":"Flowise","url":"https://www.openagentskill.com/skills/flowiseai-flowise","stars":53579,"install_command":"npx skills add FlowiseAI/Flowise","trust_score":88,"audit_score":92}],"machine_metadata":{"version":"openagentskill-agent-metadata-v2","skill":{"slug":"baidubce-app-builder","name":"App Builder","description":"appbuilder-sdk, 千帆AppBuilder-SDK帮助开发者灵活、快速的搭建AI原生应用","category":"data","url":"https://www.openagentskill.com/skills/baidubce-app-builder","repository":"https://github.com/baidubce/app-builder","github_repo":"baidubce/app-builder"},"suited_tasks":["Coding agents workflows","Claude Code teams","teams that value GitHub adoption signals","Inspect source files","Explain architecture","Patch bugs and verify changes","Chunk documents","Create embeddings"],"suited_agents":["Python","RAG","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"],"install":{"command":"npx skills add baidubce/app-builder","ready":true,"targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add baidubce/app-builder"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"App Builder\" agent skill from https://github.com/baidubce/app-builder. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: appbuilder-sdk, 千帆AppBuilder-SDK帮助开发者灵活、快速的搭建AI原生应用"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"App Builder\" as a Claude Code skill from https://github.com/baidubce/app-builder. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: appbuilder-sdk, 千帆AppBuilder-SDK帮助开发者灵活、快速的搭建AI原生应用"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"App Builder\" from https://github.com/baidubce/app-builder into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: appbuilder-sdk, 千帆AppBuilder-SDK帮助开发者灵活、快速的搭建AI原生应用"}],"handoff_url":"https://www.openagentskill.com/api/skills/baidubce-app-builder/install","manifest_url":"https://www.openagentskill.com/api/registry/manifest/baidubce-app-builder"},"trust":{"score":80,"label":"Strong shortlist","version":"trust-score-v4","install_policy":"human_review_before_install","evidence":{"stars":"583 GitHub stars","repoActivity":"583 stars, 143 forks","lastPushed":"2mo since push","license":"Apache-2.0","repository":"https://github.com/baidubce/app-builder","install":"npx skills add baidubce/app-builder","installSafety":"standard package or runtime install path","permissionSurface":"network or browser access","documentation":"Usable metadata, review docs","agentOutcomes":"No agent outcome data yet"},"outcome_evidence":{"total":0,"successes":0,"failures":0,"not_relevant":0,"success_rate":null,"recent_success_rate":null,"recent_failure_rate":null,"install_attempts":0,"install_success_rate":null,"risk_blocked":0,"setup_required":0,"avg_output_quality":null,"production_outcomes":0,"last_outcome_at":null,"label":"No agent outcome data yet"},"auto_install":{"allowed":false,"sandbox_required":true,"reason":"Human review or sandbox validation is required before automatic installation."},"best_for":["data","rag","retrieval","agent","ai-native","appbuilder"],"known_risks":["Quality score needs review","Documentation summary is thin"]},"agent_proven":{"version":"agent-proven-v1","score":0,"tier":"unproven","label":"Needs first agent run","summary":"No agent outcome reports yet. Use Resolve, run one narrow sandbox task, then report the result.","metrics":{"totalOutcomes":0,"successfulOutcomes":0,"failedOutcomes":0,"installAttempts":0,"installSuccessRate":null,"successRate":null,"recentSuccessRate":null,"recentFailureRate":null,"riskBlocked":0,"setupRequired":0,"notRelevant":0,"avgOutputQuality":null,"avgTimeToUsefulMs":null,"productionOutcomes":0,"humanReviewRequired":0,"uniqueAgents":0,"lastOutcomeAt":null},"signals":[],"penalties":["No real agent outcome evidence yet"]},"audit":{"score":83,"risk_level":"safe_to_try","risk_label":"Safe to try","warnings":["Quality score needs review","Documentation summary is thin"]},"safety_gate":{"tier":"reviewed","label":"Reviewed","auto_install_policy":"review","auto_install_allowed":false,"human_review_required":true,"blocked":false,"recommended_action":"Review the audit page, then allow agent install in a sandboxed workflow."},"quality":{"score":79,"label":"Strong"},"supply":{"track":"Coding and developer agents","scenario":"Coding agents","maintenance":"2mo since push","risk":"Safe to try"},"alternative_skills":[{"slug":"shubhamsaboo-awesome-llm-apps","name":"Awesome Llm Apps","url":"https://www.openagentskill.com/skills/shubhamsaboo-awesome-llm-apps","stars":114473,"install_command":"npx skills add Shubhamsaboo/awesome-llm-apps","trust_score":93,"audit_score":95},{"slug":"datawhalechina-hello-agents","name":"Hello Agents","url":"https://www.openagentskill.com/skills/datawhalechina-hello-agents","stars":59476,"install_command":"npx skills add datawhalechina/hello-agents","trust_score":86,"audit_score":92},{"slug":"pathwaycom-llm-app","name":"Llm App","url":"https://www.openagentskill.com/skills/pathwaycom-llm-app","stars":59299,"install_command":"npx skills add pathwaycom/llm-app","trust_score":93,"audit_score":95},{"slug":"flowiseai-flowise","name":"Flowise","url":"https://www.openagentskill.com/skills/flowiseai-flowise","stars":53579,"install_command":"npx skills add FlowiseAI/Flowise","trust_score":88,"audit_score":92}],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","Quality score needs review","Documentation summary is thin","Production credentials, payments, or irreversible account changes without explicit human review","Sensitive private data before reviewing repository code, license, and permission surface","Automatic installation in a production workspace"],"agent_contract":{"task_input":"Evaluate App Builder before installing it in an AI agent workflow","recommended_action":"Review the audit page, then allow agent install in a sandboxed workflow.","install_policy":"review","minimum_review_before_use":["Trust: 80/100 Strong shortlist","Audit: 83/100 Safe to try","Safety: 71/100 Review before install","Review repository, license, install command, and permission surface before production use."],"expected_agent_output":{"selected_skill":"baidubce-app-builder (App Builder)","install_command":"npx skills add baidubce/app-builder","risk_summary":"Safe to try; Reviewed; Review before production","verification_result":"Report the smallest successful task, files touched, warnings, and any missing setup."}},"outcome_feedback":{"endpoint":"https://www.openagentskill.com/api/agent/outcome","method":"POST","requires_resolve_event_id":true,"event_id_source":"Use install_receipt.outcome_feedback.event_id or feedback.event_id returned by /api/agent/resolve for the current task.","expected_outcomes":["success","failed","not_relevant","blocked_by_risk","setup_required"],"payload_template":{"event_id":"<install_receipt.outcome_feedback.event_id or feedback.event_id from /api/agent/resolve>","skill_slug":"baidubce-app-builder","task":"Evaluate App Builder before installing it in an AI agent workflow","agent":"codex","outcome":"success","install_used":true,"risk_blocked":false,"setup_required":false,"task_success":true,"output_quality":4,"error_type":null,"human_review_required":false,"workspace":"sandbox","time_to_useful_ms":120000,"notes":"Report the smallest successful task, setup friction, files touched, and risk notes."}},"endpoints":{"web":"https://www.openagentskill.com/skills/baidubce-app-builder","api":"https://www.openagentskill.com/api/agent/skills/baidubce-app-builder","audit":"https://www.openagentskill.com/skills/baidubce-app-builder/audit","eval":"https://www.openagentskill.com/api/agent/evals?slug=baidubce-app-builder&task=Evaluate%20App%20Builder%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&max_risk=medium","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20App%20Builder%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium","receipt":"https://www.openagentskill.com/api/agent/receipt?task=Evaluate%20App%20Builder%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium&format=text","install":"https://www.openagentskill.com/api/skills/baidubce-app-builder/install","manifest":"https://www.openagentskill.com/api/registry/manifest/baidubce-app-builder"}},"endpoints":{"web":"https://www.openagentskill.com/skills/baidubce-app-builder","api":"https://www.openagentskill.com/api/agent/skills/baidubce-app-builder","eval":"https://www.openagentskill.com/api/agent/evals?slug=baidubce-app-builder","audit":"https://www.openagentskill.com/skills/baidubce-app-builder/audit","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20App%20Builder%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium"}},"meta":{"endpoint":"/api/agent/evals","mode":"skill_eval","purpose":"Pre-install eval contract for a single skill. Agents should read this before installing a reusable skill.","generated_at":"2026-07-03T21:44:16.358Z"}}