trace_synthesis/tasks/562.json
yuyr a84d51a101 1. 增加r1生成综合策略代码和输出;
2. 增加tasks;
3. 增加analysis部分,对策略进行归纳分类,然后进行评测。
2025-04-17 17:40:15 +08:00

42 lines
1.5 KiB
JSON

{
"sites": [
"gitlab",
"reddit"
],
"task_id": 562,
"require_login": true,
"storage_state": "./.auth/gitlab.reddit_state.json",
"start_url": "http://localhost:28084",
"geolocation": null,
"intent_template": "create a repository named {{name}} that includes a README file with the links to the most active {{num}} DIY ideas on DIY subreddit?",
"instantiation_dict": {
"name": "Awesome_DIY_ideas",
"num": 6
},
"intent": "create a repository named Awesome_DIY_ideas that includes a README file with the links to the most active 6 DIY ideas on DIY subreddit?",
"require_reset": false,
"eval": {
"eval_types": [
"program_html"
],
"reference_answers": null,
"reference_url": "",
"program_html": [
{
"url": "http://localhost:28084/byteblaze/Awesome_DIY_ideas/-/raw/main/README.md",
"locator": "",
"required_contents": {
"must_include": [
"http://localhost:28080/f/DIY/118903/separate-glued-plastic-parts",
"http://localhost:28080/f/DIY/118923/how-would-you-fix-this-dryer-vent-mess",
"http://localhost:28080/f/DIY/118935/basement-bulkhead-soffit-wall-framing",
"http://localhost:28080/f/DIY/118904/ge-water-heater-pilot-light-won-t-stay-lit",
"http://localhost:28080/f/DIY/118960/attempting-to-move-a-wall-outlet-in-my-basement-a-few-inches",
"http://localhost:28080/f/DIY/118931/afci-outlet-question"
]
}
}
]
},
"intent_template_id": 88
}