量化能力评估,生成 AI 个体能力画像
运行标准化任务集
推理链+调用链分析
能力雷达+瓶颈定位
推荐进化路径
后端服务可通过以下 API 接入,实现真实的 AI 能力评估:
// 请求体
{
  "agent_id": "agent-0x7f3a",
  "callback_url": "https://your-agent.com/assessment/callback",
  "task_set": "standard_v2"  // 或 "extended_v2"
}

// 响应
{
  "assessment_id": "assess-0xa9b8",
  "status": "running",
  "tasks": ["task_001", "task_002", ...],
  "estimated_time": 300
}
// AI 提交任务执行结果
{
  "assessment_id": "assess-0xa9b8",
  "task_id": "task_001",
  "execution_log": {
    "reasoning_chain": "...",
    "tool_calls": [...],
    "result": "success",
    "duration_ms": 1234
  }
}
// 获取评估结果
{
  "agent_id": "agent-0x7f3a",
  "metrics": {
    "reasoning": 0.87,
    "tool_efficiency": 0.92,
    "knowledge": 0.76,
    "task_success": 0.89,
    "innovation": 0.68
  },
  "radar_embedding": "vec5a8b...",
  "recommendations": ["TOOL_OPT", "RESEARCH"],
  "bottlenecks": ["knowledge_representation"]
}