{
  "eval_id": 2,
  "eval_name": "next-module-recommendation",
  "prompt": "哪个模块应该优先检查和修复?",
  "assertions": [
    {
      "text": "Output provides a list of modules with priorities",
      "description": "The response should list modules in priority order"
    },
    {
      "text": "Output shows module status and call counts",
      "description": "Priority list includes status (partial/mismatch/missing) and how many times each module is called"
    },
    {
      "text": "Output explains the recommendation logic",
      "description": "Explains why certain modules are prioritized (e.g., called many times)"
    }
  ]
}