trace_synthesis/tasks/724.json
yuyr a84d51a101 1. 增加r1生成综合策略代码和输出;
2. 增加tasks;
3. 增加analysis部分,对策略进行归纳分类,然后进行评测。
2025-04-17 17:40:15 +08:00

117 lines
4.1 KiB
JSON

{
"sites": [
"reddit"
],
"task_id": 724,
"require_login": true,
"storage_state": "./.auth/reddit_state.json",
"start_url": "http://localhost:28080",
"geolocation": null,
"intent_template": "Like all submissions created by {{user}} in subreddit {{subreddit}}",
"instantiation_dict": {
"user": "Hrekires",
"subreddit": "news"
},
"intent": "Like all submissions created by Hrekires in subreddit news",
"require_reset": false,
"eval": {
"eval_types": [
"program_html"
],
"reference_answers": null,
"reference_url": "",
"program_html": [
{
"url": "http://localhost:28080/f/news/129816/gov-whitmer-signs-bills-to-repeal-right-to-work-restore",
"locator": "document.querySelector('div.submission__vote').querySelector('form').getAttribute('class')",
"required_contents": {
"must_include": [
"vote vote--user-upvoted"
]
}
},
{
"url": "http://localhost:28080/f/news/129808/disney-world-deal-with-union-will-raise-minimum-wage-to-18",
"locator": "document.querySelector('div.submission__vote').querySelector('form').getAttribute('class')",
"required_contents": {
"must_include": [
"vote vote--user-upvoted"
]
}
},
{
"url": "http://localhost:28080/f/news/129794/judge-halts-wyoming-abortion-ban-days-after-it-took-effect",
"locator": "document.querySelector('div.submission__vote').querySelector('form').getAttribute('class')",
"required_contents": {
"must_include": [
"vote vote--user-upvoted"
]
}
},
{
"url": "http://localhost:28080/f/news/129783/don-t-say-gay-lawmaker-pleads-guilty-to-covid-relief-fraud",
"locator": "document.querySelector('div.submission__vote').querySelector('form').getAttribute('class')",
"required_contents": {
"must_include": [
"vote vote--user-upvoted"
]
}
},
{
"url": "http://localhost:28080/f/news/129594/arizona-gov-katie-hobbs-refuses-to-proceed-with-execution",
"locator": "document.querySelector('div.submission__vote').querySelector('form').getAttribute('class')",
"required_contents": {
"must_include": [
"vote vote--user-upvoted"
]
}
},
{
"url": "http://localhost:28080/f/news/129508/tennessee-governor-oks-bill-to-cut-nashville-council-in-half",
"locator": "document.querySelector('div.submission__vote').querySelector('form').getAttribute('class')",
"required_contents": {
"must_include": [
"vote vote--user-upvoted"
]
}
},
{
"url": "http://localhost:28080/f/news/43839/philadelphia-da-larry-krasner-impeached-by-pa-house",
"locator": "document.querySelector('div.submission__vote').querySelector('form').getAttribute('class')",
"required_contents": {
"must_include": [
"vote vote--user-upvoted"
]
}
},
{
"url": "http://localhost:28080/f/news/43781/crypto-giant-ftx-to-file-for-bankruptcy-ceo-sam-bankman",
"locator": "document.querySelector('div.submission__vote').querySelector('form').getAttribute('class')",
"required_contents": {
"must_include": [
"vote vote--user-upvoted"
]
}
},
{
"url": "http://localhost:28080/f/news/43572/sec-doj-investigating-crypto-platform-ftx",
"locator": "document.querySelector('div.submission__vote').querySelector('form').getAttribute('class')",
"required_contents": {
"must_include": [
"vote vote--user-upvoted"
]
}
},
{
"url": "http://localhost:28080/f/news/43558/kansas-gov-laura-kelly-wins-re-election-defeating-gop",
"locator": "document.querySelector('div.submission__vote').querySelector('form').getAttribute('class')",
"required_contents": {
"must_include": [
"vote vote--user-upvoted"
]
}
}
]
},
"intent_template_id": 25
}