{"id":"a76a87a9-31ae-4678-81bb-0adbde46309a","slug":"fangmenglin918-web-evaluation-skill","name":"evaluation","description":"通用产品功能评估方法论与工具集。用于：(1) 设计新功能的评估标准体系，(2) 创建评分Prompt实现LLM-as-a-Judge，(3) 分析人工与模型评分一致性，(4) 迭代优化评估标准和Prompt。适用于AI功能评测、对话质量评估、软硬件产品体验评估等场景。当用户需要设计评估体系、创建评分标准、分析评测数据或优化评测流程时使用此skill。","canonicalUrl":"https://xpersona.co/skill/fangmenglin918-web-evaluation-skill","sourceUrl":"https://github.com/fangmenglin918-web/evaluation-skill","homepage":null,"source":"GITHUB_OPENCLEW","vendor":{"slug":"fangmenglin918-web","label":"Fangmenglin918 Web","url":"https://github.com/fangmenglin918-web/evaluation-skill"},"protocols":["OPENCLEW"],"capabilities":[],"trustScore":null,"trustConfidence":"unknown","artifactCount":0,"benchmarkCount":0,"lastRelease":null,"freshnessAt":"2026-04-14T22:27:18.522Z","freshnessLabel":"Apr 14, 2026","securityReviewed":true,"openapiReady":false,"stats":[{"label":"Trust score","value":"Unknown"},{"label":"Compatibility","value":"OpenClaw"},{"label":"Freshness","value":"Apr 14, 2026"},{"label":"Vendor","value":"Fangmenglin918 Web"},{"label":"Artifacts","value":"0"},{"label":"Benchmarks","value":"0"},{"label":"Last release","value":"Unpublished"}],"factsPreview":[{"factKey":"docs_crawl","category":"integration","label":"Crawlable docs","value":"6 indexed pages on the official domain","href":"https://github.com/login?return_to=https%3A%2F%2Fgithub.com%2Fopenclaw%2Fskills%2Ftree%2Fmain%2Fskills%2Fasleep123%2Fcaldav-calendar","sourceUrl":"https://github.com/login?return_to=https%3A%2F%2Fgithub.com%2Fopenclaw%2Fskills%2Ftree%2Fmain%2Fskills%2Fasleep123%2Fcaldav-calendar","sourceType":"search_document","confidence":"medium","observedAt":"2026-04-15T05:03:46.393Z","isPublic":true},{"factKey":"vendor","category":"vendor","label":"Vendor","value":"Fangmenglin918 Web","href":"https://github.com/fangmenglin918-web/evaluation-skill","sourceUrl":"https://github.com/fangmenglin918-web/evaluation-skill","sourceType":"profile","confidence":"medium","observedAt":"2026-04-14T22:27:18.522Z","isPublic":true},{"factKey":"protocols","category":"compatibility","label":"Protocol compatibility","value":"OpenClaw","href":"https://xpersona.co/api/v1/agents/fangmenglin918-web-evaluation-skill/contract","sourceUrl":"https://xpersona.co/api/v1/agents/fangmenglin918-web-evaluation-skill/contract","sourceType":"contract","confidence":"medium","observedAt":"2026-04-14T22:27:18.522Z","isPublic":true},{"factKey":"traction","category":"adoption","label":"Adoption signal","value":"4 GitHub stars","href":"https://github.com/fangmenglin918-web/evaluation-skill","sourceUrl":"https://github.com/fangmenglin918-web/evaluation-skill","sourceType":"profile","confidence":"medium","observedAt":"2026-04-14T22:27:18.522Z","isPublic":true},{"factKey":"handshake_status","category":"security","label":"Handshake status","value":"UNKNOWN","href":"https://xpersona.co/api/v1/agents/fangmenglin918-web-evaluation-skill/trust","sourceUrl":"https://xpersona.co/api/v1/agents/fangmenglin918-web-evaluation-skill/trust","sourceType":"trust","confidence":"medium","observedAt":null,"isPublic":true}],"highlights":["4 GitHub stars","Trust evidence available"],"agentCard":{"name":"evaluation","description":"通用产品功能评估方法论与工具集。用于：(1) 设计新功能的评估标准体系，(2) 创建评分Prompt实现LLM-as-a-Judge，(3) 分析人工与模型评分一致性，(4) 迭代优化评估标准和Prompt。适用于AI功能评测、对话质量评估、软硬件产品体验评估等场景。当用户需要设计评估体系、创建评分标准、分析评测数据或优化评测流程时使用此skill。","source":"GITHUB_OPENCLEW","sourceId":"github:1139719105","repository":"https://github.com/fangmenglin918-web/evaluation-skill","documentation":"https://xpersona.co/skill/fangmenglin918-web-evaluation-skill/agent/fangmenglin918-web-evaluation-skill","protocols":["OPENCLEW"],"languages":["typescript"],"install":{"command":"git clone https://github.com/fangmenglin918-web/evaluation-skill.git","ecosystem":"git"},"examples":[{"kind":"example","language":"text","snippet":"定义功能 → 拆解维度 → 制定标准 → 人工打分基准\n    ↑                                    ↓\n循环迭代 ← 一致性对比 ← 模型跑分 ← Prompt优化 ← 标准优化"},{"kind":"example","language":"text","snippet":"1. 角色设定（严苛的审计员）\n2. 任务背景（评估场景和目标）\n3. 评分档位定义（0-4分详细条款）\n4. 打分流程（倒金字塔筛选）\n5. 输入格式说明\n6. 输出格式规范（JSON）\n7. 典型案例参考"}]}}