18641 lines
697 KiB
JSON
18641 lines
697 KiB
JSON
[
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 0,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the least expensive {{product}} from \"{{category}}\" category.",
|
|
"intent": "Buy the least expensive red blanket (in any size) from \"Blankets & Throws\" category.",
|
|
"instantiation_dict": {
|
|
"category": "Blankets & Throws",
|
|
"product": "red blanket (in any size)"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B0983XCYK6",
|
|
"Red"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 0,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 1,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the least expensive {{product}} from \"{{category}}\" category.",
|
|
"intent": "Buy the least expensive blue headset from \"Virtual Reality (VR) Headsets\" category.",
|
|
"instantiation_dict": {
|
|
"category": "Virtual Reality (VR) Headsets",
|
|
"product": "blue headset"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09MP3SGPN"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 0,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 2,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the least expensive {{product}} from \"{{category}}\" category.",
|
|
"intent": "Buy the least expensive canvas print with grapes from \"Posters & Prints\" category.",
|
|
"instantiation_dict": {
|
|
"category": "Posters & Prints",
|
|
"product": "canvas print with grapes"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B08ZCCRMH4"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 0,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 3,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I am doing a market survey for one stop market, show me the most expensive {{product}} from \"{{product_category}}\" category",
|
|
"intent": "I am doing a market survey for one stop market, show me the most expensive red controller from \"PS4 accessories\" category",
|
|
"instantiation_dict": {
|
|
"product": "red controller",
|
|
"product_category": "PS4 accessories"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/dualshock-4-wireless-controller-for-playstation-4-magma-red.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 1,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 4,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I am doing a market survey for one stop market, show me the most expensive {{product}} from \"{{product_category}}\" category",
|
|
"intent": "I am doing a market survey for one stop market, show me the most expensive black and white item from \"Posters & Prints\" category",
|
|
"instantiation_dict": {
|
|
"product": "black and white item",
|
|
"product_category": "Posters & Prints"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/signature-design-by-ashley-pancho-modern-framed-cow-canvas-wall-art-48-x-36-black-white.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 1,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 5,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I am doing a market survey for one stop market, show me the most expensive {{product}} from \"{{product_category}}\" category",
|
|
"intent": "I am doing a market survey for one stop market, show me the most expensive yellow product from \"Dried Fruits & Vegetables\" category",
|
|
"instantiation_dict": {
|
|
"product": "yellow product",
|
|
"product_category": "Dried Fruits & Vegetables"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/sun-maid-california-golden-raisins-15-ounce-boxes-pack-of-24.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 1,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 6,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "{{modifier}}List the full product names of {{color}} {{product}} and tell me the price range of the available products",
|
|
"intent": "Search for 'Nike slide slippers'. List the full product names of red ones on the first page and tell me the price range of the available products",
|
|
"instantiation_dict": {
|
|
"modifier": "Search for 'Nike slide slippers'. ",
|
|
"color": "red",
|
|
"product": "ones on the first page"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"Nike Men's Air Max Camden Slide Sandal",
|
|
"Nike Men's Benassi JDI Fanny Pack Slides",
|
|
"Nike Offcourt Slide Mens Bq4639-002 Size 12",
|
|
"Nike Jordan Men's Break Slide Red AR6374-602",
|
|
"42.81",
|
|
"69.00"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "These models are availiable: Nike Men's Air Max Camden Slide Sandal, Nike Men's Benassi JDI Fanny Pack Slides, Nike Offcourt Slide Mens Bq4639-002 Size 12, Nike Jordan Men's Break Slide Red AR6374-602. The price ranges from $42.81 to $69.00"
|
|
},
|
|
"intent_template_id": 2,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 7,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "{{modifier}}List the full product names of {{color}} {{product}} and tell me the price range of the available products",
|
|
"intent": "Search for 'pencil case'. List the full product names of those with animal designs on the first page and tell me the price range of the available products",
|
|
"instantiation_dict": {
|
|
"modifier": "Search for 'pencil case'. ",
|
|
"color": "those with",
|
|
"product": "animal designs on the first page"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"Cosmetic Bag Leather Pencil Case,Cosmetic Bag Leather Pencil Case,Two Wolves,Portable Small Makeup Bags Travel bag Multifunctional Pen Holder Box with Zipper for Women Girls Lady Teens",
|
|
"Danielle Cute Boston Terrier, Frenchie, French Bulldog Portable Pencil Case, Cosmetic Travel Organizer Bag | 9x3x3 in",
|
|
"Dinosaur Pattern Travel Bag Large Toiletries Bag Cosmetic Pouch Pencil Case Tote Multifunction Organizer Storage Bag",
|
|
"Leopard Paw Cosmetic Bag Pink Makeup Bag for Girls Women Portable Travel Pencil Case Water-resistant Organizer Birthday Christmas Gift",
|
|
"5.99",
|
|
"38.67"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": ""
|
|
},
|
|
"intent_template_id": 2,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 8,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=+Lays",
|
|
"geolocation": null,
|
|
"intent_template": "{{modifier}}List the full product names of {{color}} {{product}} and tell me the price range of the available products",
|
|
"intent": "List the full product names of red packaging Lays chips on this page and tell me the price range of the available products",
|
|
"instantiation_dict": {
|
|
"modifier": "",
|
|
"color": "red packaging",
|
|
"product": "Lays chips on this page"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"Canadian Lays Ketchup Chips - 1 Family Size Bag",
|
|
"Canadian Lays Ketchup Potato Chips (4pk) 180g/6.3 oz., {Imported from Canada}",
|
|
"LAYS Brand , Crispy Potato Chips Smoked Salmon Cream Cheese Flavour, 67g X 2 Packs",
|
|
"11.85",
|
|
"38.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "These are availiable: Canadian Lays Ketchup Chips - 1 Family Size Bag, Canadian Lays Ketchup Potato Chips (4pk) 180g/6.3 oz., {Imported from Canada}, LAYS Brand , Crispy Potato Chips Smoked Salmon Cream Cheese Flavour, 67g X 2 Packs. The price ranges from $11.85 to $38.99"
|
|
},
|
|
"intent_template_id": 2,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 9,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Show me the {{order}} in the \"{{product}}\" search results by {{sorting_order}}.",
|
|
"instantiation_dict": {
|
|
"order": "first item in the second row",
|
|
"product": "chairs",
|
|
"sorting_order": "descending price"
|
|
},
|
|
"intent": "Show me the first item in the second row in the \"chairs\" search results by descending price.",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/oeukji-office-chairs-office-products-boss-chair-business-home-office-chair-reclining-computer-chair-leather-boss-chair-swivel-chair-executive-chair.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 3,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 10,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Show me the {{order}} in the \"{{product}}\" search results by {{sorting_order}}.",
|
|
"instantiation_dict": {
|
|
"order": "third item in the second row",
|
|
"product": "frozen pizza",
|
|
"sorting_order": "descending price"
|
|
},
|
|
"intent": "Show me the third item in the second row in the \"frozen pizza\" search results by descending price.",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/portobello-arancini-bites-gourmet-frozen-appetizers-set-of-8-trays.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 3,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 11,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Show me the {{order}} in the \"{{product}}\" search results by {{sorting_order}}.",
|
|
"instantiation_dict": {
|
|
"order": "first item with round cookies",
|
|
"product": "ice cream sandwiches",
|
|
"sorting_order": "descending relevance"
|
|
},
|
|
"intent": "Show me the first item with round cookies in the \"ice cream sandwiches\" search results by descending relevance.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/skinny-cow-gone-wild-low-fat-ice-cream-sandwiches-box-vanilla-24-fl-oz-pack-of-6.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 3,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 12,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Show me the {{order}} in the \"{{product}}\" search results by {{sorting_order}}.",
|
|
"instantiation_dict": {
|
|
"order": "first painting",
|
|
"product": "van gogh",
|
|
"sorting_order": "descending relevance"
|
|
},
|
|
"intent": "Show me the first painting in the \"van gogh\" search results by descending relevance.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/decorarts-cafe-terrace-at-night-vincent-van-gogh-art-reproduction-giclee-canvas-prints-wall-art-for-home-decor-30x24.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 3,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 13,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "What is the price range for products in the {{region}}?",
|
|
"instantiation_dict": {
|
|
"region": "first row of this page"
|
|
},
|
|
"intent": "What is the price range for products in the first row of this page?",
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"14.47",
|
|
"23.50"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$14.47 - $23.50"
|
|
},
|
|
"intent_template_id": 4,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 14,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/nintendo-switch.html",
|
|
"geolocation": null,
|
|
"intent_template": "What is the price range for products in the {{region}}?",
|
|
"instantiation_dict": {
|
|
"region": "last row of this page"
|
|
},
|
|
"intent": "What is the price range for products in the last row of this page?",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"4.95",
|
|
"43.00"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$4.95 - $43.00"
|
|
},
|
|
"intent_template_id": 4,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 15,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/sport-specific-clothing/competitive-swimwear.html?product_list_limit=36",
|
|
"geolocation": null,
|
|
"intent_template": "What is the price range for products in the {{region}}?",
|
|
"instantiation_dict": {
|
|
"region": "second and third rows of this page"
|
|
},
|
|
"intent": "What is the price range for products in the second and third rows of this page?",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"4.99",
|
|
"16.09"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$4.99 - $16.09"
|
|
},
|
|
"intent_template_id": 4,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 16,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/office-products/office-electronics/printers-accessories.html?p=3",
|
|
"geolocation": null,
|
|
"intent_template": "What is the price range for products in the {{region}}?",
|
|
"instantiation_dict": {
|
|
"region": "first column of this page"
|
|
},
|
|
"intent": "What is the price range for products in the first column of this page?",
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"47.69",
|
|
"488.83"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$47.69 - $488.83"
|
|
},
|
|
"intent_template_id": 4,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 17,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/electronics/video-projectors.html",
|
|
"geolocation": null,
|
|
"intent_template": "What is the price range for products in the {{region}}?",
|
|
"instantiation_dict": {
|
|
"region": "last column of this page"
|
|
},
|
|
"intent": "What is the price range for products in the last column of this page?",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"123.41",
|
|
"184.59"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$123.41 - $184.59"
|
|
},
|
|
"intent_template_id": 4,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 18,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "What is the price of the most expensive {{color}} product in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"color": "red",
|
|
"product_category": "Basic Cases"
|
|
},
|
|
"intent": "What is the price of the most expensive red product in the \"Basic Cases\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"42.98"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$42.98"
|
|
},
|
|
"intent_template_id": 5,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 19,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "What is the price of the most expensive {{color}} product in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"color": "feather lamp",
|
|
"product_category": "Lamps & Shades"
|
|
},
|
|
"intent": "What is the price of the most expensive feather lamp product in the \"Lamps & Shades\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"920.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$920.99"
|
|
},
|
|
"intent_template_id": 5,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 20,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "What is the price of the most expensive {{color}} product in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"color": "blue",
|
|
"product_category": "Posters & Prints"
|
|
},
|
|
"intent": "What is the price of the most expensive blue product in the \"Posters & Prints\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"399.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$399.99"
|
|
},
|
|
"intent_template_id": 5,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 21,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "What is the color of the {{type}} item in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"type": "most expensive",
|
|
"product_category": "Over-Ear Headphones"
|
|
},
|
|
"intent": "What is the color of the most expensive item in the \"Over-Ear Headphones\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"black"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "black"
|
|
},
|
|
"intent_template_id": 6,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 22,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "What is the color of the {{type}} item in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"type": "second cheapest",
|
|
"product_category": "Snack Gifts"
|
|
},
|
|
"intent": "What is the color of the second cheapest item in the \"Snack Gifts\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"red |OR| yellow"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "red and yellow"
|
|
},
|
|
"intent_template_id": 6,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 23,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "What is the color of the {{type}} item in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"type": "third most expensive",
|
|
"product_category": "Exercise & Fitness"
|
|
},
|
|
"intent": "What is the color of the third most expensive item in the \"Exercise & Fitness\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"red"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "red"
|
|
},
|
|
"intent_template_id": 6,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 24,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Search for \"{{keyword}}\" and show me the {{item_order}} item {{condition}}",
|
|
"instantiation_dict": {
|
|
"keyword": "usb wifi",
|
|
"item_order": "first",
|
|
"condition": "in the second row"
|
|
},
|
|
"intent": "Search for \"usb wifi\" and show me the first item in the second row",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/edup-usb-wifi-adapter-dual-band-wireless-network-adapter-802-11-ac-2-4g-5g-usb-wi-fi-dongle-with-extender-antenna-compatible-with-windows-xp-vista-7-8-1-10-mac-os-x-10-7-10-15.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 7,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 25,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Search for \"{{keyword}}\" and show me the {{item_order}} item {{condition}}",
|
|
"instantiation_dict": {
|
|
"keyword": "raincoat",
|
|
"item_order": "first",
|
|
"condition": "that is blue in color"
|
|
},
|
|
"intent": "Search for \"raincoat\" and show me the first item that is blue in color",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/wuai-women-oversized-raincoats-rain-jackets-plus-size-lightweight-waterproof-trench-coat-outdoor-packable-windbreaker-s-5xl.html |OR| __SHOPPING__/jspoyou-mens-windproof-rain-jacket-detachable-hooded-lightweight-breathable-trench-coat-winter-warm-packable-raincoat-outwear.html |OR| __SHOPPING__/lightweight-hooded-rain-coat-womens-waterproof-zipper-jacket-windproof-waterproof-raincoat-jacket-light-comfy-outdoor.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 7,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 26,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Search for \"{{keyword}}\" and show me the {{item_order}} item {{condition}}",
|
|
"instantiation_dict": {
|
|
"keyword": "plush toy",
|
|
"item_order": "first",
|
|
"condition": "that is pink in color"
|
|
},
|
|
"intent": "Search for \"plush toy\" and show me the first item that is pink in color",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/olpchee-foldable-plush-children-s-sofa-backrest-chair-cute-cartoon-infant-baby-seat-for-living-room-bedroom-corgi.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 7,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 27,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Show me the first {{design}} in the search results for \"{{product}}\".",
|
|
"instantiation_dict": {
|
|
"design": "white table",
|
|
"product": "table"
|
|
},
|
|
"intent": "Show me the first white table in the search results for \"table\".",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/n-a-yyhen-beautiful-three-legged-wooden-coffee-tableiving-room-balcony-simple-end-table-white.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 8,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 28,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Show me the first {{design}} in the search results for \"{{product}}\".",
|
|
"instantiation_dict": {
|
|
"design": "rainbow colored coat",
|
|
"product": "winter coat"
|
|
},
|
|
"intent": "Show me the first rainbow colored coat in the search results for \"winter coat\".",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/winter-coat-men-fashion-casual-buckle-lapels-printed-single-breasted-suit-jacket.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 8,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 29,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Show me the first {{design}} in the search results for \"{{product}}\".",
|
|
"instantiation_dict": {
|
|
"design": "red coat",
|
|
"product": "winter coat"
|
|
},
|
|
"intent": "Show me the first red coat in the search results for \"winter coat\".",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/smooto-winter-coats-women-s-warm-hooded-thick-padded-outerwear-jackets-overcoat.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 8,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 30,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Show me the first {{design}} in the search results for \"{{product}}\".",
|
|
"instantiation_dict": {
|
|
"design": "coat with a furry hood",
|
|
"product": "winter coat"
|
|
},
|
|
"intent": "Show me the first coat with a furry hood in the search results for \"winter coat\".",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/charmap-winter-coats-for-women-warm-coat-jacket-outwear-faux-fur-lined-trench-winter-hooded-thick-overcoat.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 8,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 31,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Explore the \"{{category}}\" category listed by ascending price and add the first {{design}} item to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"category": "Headphones",
|
|
"design": "blue"
|
|
},
|
|
"intent": "Explore the \"Headphones\" category listed by ascending price and add the first blue item to my shopping cart.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Audio-Technica ATH-CLR100iSBL SonicFuel In-Ear Headphones with In-Line Microphone & Control, Blue"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 9,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 32,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Explore the \"{{category}}\" category listed by ascending price and add the first {{design}} item to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"category": "Makeup Palettes",
|
|
"design": "blue palette"
|
|
},
|
|
"intent": "Explore the \"Makeup Palettes\" category listed by ascending price and add the first blue palette item to my shopping cart.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Cosmetic Matte Eyeshadow Cream Christmas Makeup Palette-Shimmer Set, 9 Colors Waterproof Eyeshadow Palettes Contour Palettes Powder Shimmer (A)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 9,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 33,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Explore the \"{{category}}\" category listed by ascending price and tell me the color of the {{order}} item in the first row.",
|
|
"instantiation_dict": {
|
|
"category": "Competitive Swimwear",
|
|
"order": "second"
|
|
},
|
|
"intent": "Explore the \"Competitive Swimwear\" category listed by ascending price and tell me the color of the second item in the first row.",
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"pink"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "pink"
|
|
},
|
|
"intent_template_id": 10,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 34,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Explore the \"{{category}}\" category listed by ascending price and tell me the colors of the {{order}} item in the first row.",
|
|
"instantiation_dict": {
|
|
"category": "Artificial Plants & Flowers",
|
|
"order": "first"
|
|
},
|
|
"intent": "Explore the \"Artificial Plants & Flowers\" category listed by ascending price and tell me the colors of the first item in the first row.",
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"red"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "red and green"
|
|
},
|
|
"intent_template_id": 11,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 35,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Explore the \"{{category}}\" category listed by ascending price and tell me the color of the {{order}} item in the first row.",
|
|
"instantiation_dict": {
|
|
"category": "Patio Furniture & Accessories",
|
|
"order": "fourth"
|
|
},
|
|
"intent": "Explore the \"Patio Furniture & Accessories\" category listed by ascending price and tell me the color of the fourth item in the first row.",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"one_of": [
|
|
"yellow",
|
|
"gold"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "yellow"
|
|
},
|
|
"intent_template_id": 10,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 36,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/dairy-cheese-eggs/cheese.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} in the {{location}} to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "round cheese",
|
|
"location": "first row of this page"
|
|
},
|
|
"intent": "Add the round cheese in the first row of this page to my wish list.",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Queijo Minas Mineiro Curado Brazilian Minas Cheese Gourmet Aged Cheese"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 12,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 37,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/bedding/blankets-throws.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "navy blue one in the second column"
|
|
},
|
|
"intent": "Add the navy blue one in the second column to my wish list.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"PEACE NEST Lightweight Down and Feather Fiber Throw Blanket Soft Couch Throw for Indoor and Outdoor Use, 50\"x70\", Navy Blue"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 13,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 38,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/women/uniforms-work-safety.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "pink ones on this page"
|
|
},
|
|
"intent": "Add the pink ones on this page to my wish list.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Wukong Direct Pants Practice Pants Cotton Pants Comfortable Breathable Bloomers Yoga"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 13,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 39,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/oral-care/orthodontic-supplies.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "colorful thing on this page"
|
|
},
|
|
"intent": "Add the colorful thing on this page to my wish list.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"50Pcs/Bag Disposable Plastic Elastic Placers Dental Elastic Rubber Band Dental Orthodontic Product Multi Color"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 13,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 40,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "What is the {{attribute}} and price of the cheapest item in the \"{{category}}\" category?",
|
|
"instantiation_dict": {
|
|
"attribute": "shape",
|
|
"category": "Chocolate"
|
|
},
|
|
"intent": "What is the shape and price of the cheapest item in the \"Chocolate\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"one_of": [
|
|
"circular",
|
|
"circle",
|
|
"sphere",
|
|
"round"
|
|
],
|
|
"must_include": [
|
|
"1.04"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "circle, $1.04"
|
|
},
|
|
"intent_template_id": 14,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 41,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "What is the {{attribute}} and price of the cheapest item in the \"{{category}}\" category?",
|
|
"instantiation_dict": {
|
|
"attribute": "color",
|
|
"category": "Men's Uniforms, Work & Safety"
|
|
},
|
|
"intent": "What is the color and price of the cheapest item in the \"Men's Uniforms, Work & Safety\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"white",
|
|
"0.19"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "white, $0.19"
|
|
},
|
|
"intent_template_id": 14,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 42,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "What is the {{attribute}} and price of the cheapest item in the \"{{category}}\" category?",
|
|
"instantiation_dict": {
|
|
"attribute": "color",
|
|
"category": "Decorative Pillows, Inserts & Covers"
|
|
},
|
|
"intent": "What is the color and price of the cheapest item in the \"Decorative Pillows, Inserts & Covers\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"black",
|
|
"1.93"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "black, $1.93"
|
|
},
|
|
"intent_template_id": 14,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 43,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Find me the cheapest item in the \"{{category}}\" category that comes in {{shape}}.",
|
|
"instantiation_dict": {
|
|
"category": "Soups, Stocks & Broths",
|
|
"shape": "rectangular packaging"
|
|
},
|
|
"intent": "Find me the cheapest item in the \"Soups, Stocks & Broths\" category that comes in rectangular packaging.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/ocean-s-halo-organic-and-vegan-no-chicken-broth-32-oz-per-unit-2-pack.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 15,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 44,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Find me the cheapest item in the \"{{category}}\" category that comes in {{shape}}.",
|
|
"instantiation_dict": {
|
|
"category": "Posters & Prints",
|
|
"shape": "blue"
|
|
},
|
|
"intent": "Find me the cheapest item in the \"Posters & Prints\" category that comes in blue.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/palacelearning-the-starry-night-1889-by-vincent-van-gogh-fine-art-poster-wall-art-print-laminated-18-x-24.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 15,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 45,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Find me the cheapest item in the \"{{category}}\" category that comes in {{shape}}.",
|
|
"instantiation_dict": {
|
|
"category": "Children's Dental Care",
|
|
"shape": "the style of a cupcake"
|
|
},
|
|
"intent": "Find me the cheapest item in the \"Children's Dental Care\" category that comes in the style of a cupcake.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/children-s-toothbrush-u-shaped-age-2-12-kids-silicone-toothbrush-food-soft-silicone-brush-head-with-cute-cake-look.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 15,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 46,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/kitchen-dining/kitchen-table-linens.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{attribute}} one in the {{order}} to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"attribute": "red",
|
|
"order": "second row of this page"
|
|
},
|
|
"intent": "Add the red one in the second row of this page to my shopping cart.",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"ARTSHOWING Anchor Table Runner and Placemats Set of 6, Burlap Linen Table Runners 13x90inch, Heat-Insulating Placemats for Table Decor, Love The Life You Live"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 16,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 47,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/home-decor-products/artificial-plants-flowers.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{attribute}} one in the {{order}} to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"attribute": "yellow",
|
|
"order": "first row of this page"
|
|
},
|
|
"intent": "Add the yellow one in the first row of this page to my shopping cart.",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Csyidio 6 Bundles Artificial Daisy Flowers Plastic Flowers Outdoor UV Resistant Plants Shrubs for Garden Porch Hanging Planter Window Box Decor(Yellow)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 16,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 48,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/office-products/office-furniture-lighting/chairs-sofas.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{attribute}} one in the {{order}} to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"attribute": "white",
|
|
"order": "bottom row of this page"
|
|
},
|
|
"intent": "Add the white one in the bottom row of this page to my shopping cart.",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"YAMASORO Ergonomic Executive Office Chair White High Back Leather Computer Chair,Office Desk Chair with Arms and Wheels"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 16,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 49,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/men/clothing.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} to my wish list.",
|
|
"intent": "Add the green checkered polo shirt (in any size) on this page to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "green checkered polo shirt (in any size) on this page"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Men & Boy Long Sleeve Flannel Plaid Casual Shirts Button Down Regular Fit Long Sleeve Cotton Polo Shirt L-5XL"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 13,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 50,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/women/clothing.html?p=2&product_list_limit=36",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} to my wish list.",
|
|
"intent": "Add the neon green shirt to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "neon green shirt"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Short Sleeve Dry-Fit Workout Shirt - Loppet, 2-Pack"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 13,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 51,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/furniture/home-office-furniture.html?p=4&product_list_limit=36",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} {{condition}} to my wish list.",
|
|
"intent": "Add the pink bookcase that looks like a pig to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "pink bookcase",
|
|
"condition": "that looks like a pig"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Home Bookshelf Bookcase Shelf Bookshelf Book Shelves Simple Student Desktop Small Picture Book Storage Household Simple Floor Living Room Children's Bookcase Durable Bookcase Display Shelf Storage Org"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 17,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 52,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/patio-lawn-garden/gardening-lawn-care/pots-planters-container-accessories.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} {{condition}} to my wish list.",
|
|
"intent": "Add the one that looks like a wooden log to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "one",
|
|
"condition": "that looks like a wooden log"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"REAL Planters H-2 Horizontal Log Planter, Medium, Oak"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 17,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 53,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/fan-shop/footwear.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} to my wish list.",
|
|
"intent": "Add the blue and orange one to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "blue and orange one"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"SKICKS Florida Gators Slip-On Sneaker - Adult Unisex"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 13,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 54,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/wall-art/posters-prints.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} {{condition}} to my wish list.",
|
|
"intent": "Add the one with waves to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "one",
|
|
"condition": "with waves"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"SiMiWOW Beach Lighthouse Wall Art Blue Ocean Coastal Painting Canvas Print Framed Artwork Bathroom Bedroom Living Room Decor 16\"x24\""
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 17,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 55,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/wall-art/posters-prints.html?product_list_order=price",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} in the {{location}} to my wish list.",
|
|
"intent": "Add the first one in the second row to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "first one",
|
|
"location": "second row"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"QTESPEII Framed Kitchen Pictures Wall Art Decor Green Grape and Red Wine Canvas Prints"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 12,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 56,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/skin-care/sunscreens-tanning-products.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} in the {{location}} to my wish list.",
|
|
"intent": "Add the orange one in the first row to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "orange one",
|
|
"location": "first row"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Banana Boat Ultra Sport Sunscreen Lotion, Broad Spectum SPF 30, 8 Fl Oz"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 12,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 57,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/home-decor-products/artificial-plants-flowers.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} {{condition}} to my wish list.",
|
|
"intent": "Add the one on this page with 'garden' written on it to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "one on this page",
|
|
"condition": "with 'garden' written on it"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Artificial Succulent Plant Pot Milk White Ceramic Flowerpot Wine Bottle can Shape Home Office Desktop Countertop Decoration Small Potted Plant (ws8003)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 17,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 58,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/furniture/game-recreation-room-furniture.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} in the {{location}} to my wish list.",
|
|
"intent": "Add the brown one in the first row to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "brown one",
|
|
"location": "first row"
|
|
},
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Set of 2 Bar Stools Pub Chair Fabric w/Wood Legs Backrest Home Furniture Brown HilariousM Stoolseating Office Chair Desk Chair Bar stools Folding Table Step Stool Folding Chair Patio Chair"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 12,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 59,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/home-decor-products/artificial-plants-flowers.html",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me the price of the {{product}} in the {{location}}.",
|
|
"intent": "Tell me the price of the yellow one in the first row.",
|
|
"instantiation_dict": {
|
|
"product": "yellow one",
|
|
"location": "first row"
|
|
},
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"37.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$37.99"
|
|
},
|
|
"intent_template_id": 18,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 60,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/health-household/health-care.html",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me the price of the {{product}}.",
|
|
"intent": "Tell me the price of the purple one on this page.",
|
|
"instantiation_dict": {
|
|
"product": "purple one on this page"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"17.47"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$17.47"
|
|
},
|
|
"intent_template_id": 19,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 61,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/bedding/decorative-pillows-inserts-covers.html",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me the price of the {{product}} in the {{location}}.",
|
|
"intent": "Tell me the price of the pink one in the first row.",
|
|
"instantiation_dict": {
|
|
"product": "pink one",
|
|
"location": "first row"
|
|
},
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"26.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$26.99"
|
|
},
|
|
"intent_template_id": 18,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 62,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/exercise-fitness.html",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me the price of the {{product}} in the {{location}}.",
|
|
"intent": "Tell me the price of the yellow item in the first row.",
|
|
"instantiation_dict": {
|
|
"product": "yellow item",
|
|
"location": "first row"
|
|
},
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"10.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$10.99"
|
|
},
|
|
"intent_template_id": 18,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 63,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breads-bakery/cookies.html",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me the price of the {{product}} in the {{location}}.",
|
|
"intent": "Tell me the price of the purple one in the first row.",
|
|
"instantiation_dict": {
|
|
"product": "purple one",
|
|
"location": "first row"
|
|
},
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"18.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$18.99"
|
|
},
|
|
"intent_template_id": 18,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 64,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breads-bakery/cookies.html",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me the price of the {{product}} in the {{location}}.",
|
|
"intent": "Tell me the price of the green one in the first row.",
|
|
"instantiation_dict": {
|
|
"product": "green one",
|
|
"location": "first row"
|
|
},
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"25.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$25.99"
|
|
},
|
|
"intent_template_id": 18,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 65,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/playstation-4/accessories.html",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me the price of the {{product}} in the {{location}}.",
|
|
"intent": "Tell me the price of the blue one in the first row.",
|
|
"instantiation_dict": {
|
|
"product": "blue one",
|
|
"location": "first row"
|
|
},
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"16.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$16.99"
|
|
},
|
|
"intent_template_id": 18,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 66,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "List out reviewers, if exist, who mention {{description}} for the {{product}}",
|
|
"instantiation_dict": {
|
|
"description": "being disappointed",
|
|
"product": "first red and yellow product"
|
|
},
|
|
"intent": "List out reviewers, if exist, who mention being disappointed for the first red and yellow product",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"John",
|
|
"Vini C",
|
|
"Amazon Customer",
|
|
"Katie Switalski",
|
|
"Catherine L."
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "John, Vini C, Amazon Customer, Katie Switalski, Catherine L."
|
|
},
|
|
"intent_template_id": 20,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 67,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/hair-care/hair-coloring-products.html",
|
|
"geolocation": null,
|
|
"intent_template": "List out reviewers, if exist, who mention {{description}} for the {{product}}",
|
|
"instantiation_dict": {
|
|
"description": "'dark'",
|
|
"product": "second product in the first row"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"intent": "List out reviewers, if exist, who mention 'dark' for the second product in the first row",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"jakeanielsen",
|
|
"Jessie Mora",
|
|
"Loyal AmazonianLoyal Amazonian"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "jakeanielsen, Jessie Mora, Loyal AmazonianLoyal Amazonian"
|
|
},
|
|
"intent_template_id": 20,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 68,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "List out reviewers, if exist, who mention {{description}} for the {{product}}",
|
|
"instantiation_dict": {
|
|
"description": "'disgust'",
|
|
"product": "purple product"
|
|
},
|
|
"intent": "List out reviewers, if exist, who mention 'disgust' for the purple product",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"Maria A.",
|
|
"Amazon CustomerAmazon Customer"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "Maria A., Amazon CustomerAmazon Customer"
|
|
},
|
|
"intent_template_id": 20,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 69,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "List out reviewers, if exist, who mention {{description}} for the {{product}}",
|
|
"instantiation_dict": {
|
|
"description": "'hot'",
|
|
"product": "item in black packaging"
|
|
},
|
|
"intent": "List out reviewers, if exist, who mention 'hot' for the item in black packaging",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"Prodajr"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "Prodajr"
|
|
},
|
|
"intent_template_id": 20,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 70,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/bedding/decorative-pillows-inserts-covers.html",
|
|
"geolocation": null,
|
|
"intent_template": "List out reviewers, if exist, who mention {{description}} for the {{product}}",
|
|
"instantiation_dict": {
|
|
"description": "'cute'",
|
|
"product": "pink thing"
|
|
},
|
|
"intent": "List out reviewers, if exist, who mention 'cute' for the pink thing",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"Lou HS",
|
|
"Mrs. Renfro"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "Lou HS, Mrs. Renfro"
|
|
},
|
|
"intent_template_id": 20,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 71,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/playstation-4/accessories.html",
|
|
"geolocation": null,
|
|
"intent_template": "List out reviewers, if exist, who mention {{description}} for the {{product}}",
|
|
"instantiation_dict": {
|
|
"description": "malfunctioning",
|
|
"product": "item with the black and white graphic design"
|
|
},
|
|
"intent": "List out reviewers, if exist, who mention malfunctioning for the item with the black and white graphic design",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There are no reviews on this item.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 20,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 72,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/mens-sweatpants-halloween-pumpkin-face-sport-pants-joggers-pants-soft-casual-pants.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add this to my cart if {{condition}}",
|
|
"instantiation_dict": {
|
|
"condition": "it comes in orange"
|
|
},
|
|
"intent": "Add this to my cart if it comes in orange",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Mens Sweatpants Halloween Pumpkin Face Sport Pants Joggers Pants Soft Casual Pants"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 21,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 73,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/kangol-men-s-formal-sock-3-pack.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add this to my cart if {{condition}}",
|
|
"instantiation_dict": {
|
|
"condition": "it comes in red"
|
|
},
|
|
"intent": "Add this to my cart if it comes in red",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Kangol Men's Formal Sock, 3 Pack"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 21,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 74,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/wieco-art-sunflower-by-vincent-van-gogh-oil-paintings-reproduction-modern-floral-giclee-canvas-prints-artwork-flowers-pictures-on-canvas-wall-art-for-home-and-office-decorations.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add this to my cart if {{condition}}",
|
|
"instantiation_dict": {
|
|
"condition": "it is yellow"
|
|
},
|
|
"intent": "Add this to my cart if it is yellow",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Wieco Art Sunflower by Vincent Van Gogh"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 21,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 75,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/electronics/car-vehicle-electronics/car-electronics.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} in the {{location}} to my wish list.",
|
|
"intent": "Add the first product in the second row to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "first product",
|
|
"location": "second row"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Amzparts 6.5\" MIB Car Radio Stereo 19D 035 280 Carplay Mirrorlink BT USB AUX For Volkswagen Bora T-ROC Sportsvan Touran L"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 12,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 76,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/novelty-more.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} in the {{location}} to my wish list.",
|
|
"intent": "Add the last product in the last row to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "last product",
|
|
"location": "last row"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"INTIMO Elf The Movie Men's Cotton Headed Ninny Muggins Allover Holiday Christmas Film Loungewear Pajama Pants"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 12,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 77,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/patio-lawn-garden/patio-furniture-accessories.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} in the {{location}} to my wish list.",
|
|
"intent": "Add the third product in the first row to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "third product",
|
|
"location": "first row"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Synthetic Rattan Woven Material, Plastic Rattan Furniture for Weaving and Repairing Tables and Chairs, Storage Basket, Ect (500 G)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 12,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 78,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/furniture/living-room-furniture.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the {{product}} in the {{location}} to my wish list.",
|
|
"intent": "Add the first product in the last row to my wish list.",
|
|
"instantiation_dict": {
|
|
"product": "first product",
|
|
"location": "last row"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"HIFIT End Table Set of 2, Narrow Side Table with Drawers, Flip Top End Side Table with Storage for Small Space, Bedside Table for Living Room Bedroom, Dark Brown"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 12,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 79,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/electronics/video-projectors.html",
|
|
"geolocation": null,
|
|
"intent_template": "What is the price range for products in the {{region}}?",
|
|
"intent": "What is the price range for products in the second row?",
|
|
"instantiation_dict": {
|
|
"region": "second row"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"55.98",
|
|
"624.28"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$55.98 - $624.28"
|
|
},
|
|
"intent_template_id": 4,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 80,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/cell-phones-accessories/cases-holsters-sleeves/basic-cases.html",
|
|
"geolocation": null,
|
|
"intent_template": "What is the price range for products in the {{region}}?",
|
|
"intent": "What is the price range for products in the last row?",
|
|
"instantiation_dict": {
|
|
"region": "last row"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"9.99",
|
|
"14.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$9.99 - $14.99"
|
|
},
|
|
"intent_template_id": 4,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 81,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/health-household/health-care.html",
|
|
"geolocation": null,
|
|
"intent_template": "What is the price range for products in the {{region}}?",
|
|
"intent": "What is the price range for products in the first row?",
|
|
"instantiation_dict": {
|
|
"region": "first row"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"13.12",
|
|
"72.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$13.12 - $72.99"
|
|
},
|
|
"intent_template_id": 4,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 82,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/alaza-cartoon-pineapple-stripe-house-fleece-slippers-comfy-bedroom-shoes-anti-slip-for-men-us-9-10.html |AND| __SHOPPING__/reef-men-s-twinpin-prints-sandals.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the product that {{attribute}} from my open tabs to the shopping cart",
|
|
"instantiation_dict": {
|
|
"attribute": "is darker in color"
|
|
},
|
|
"intent": "Add the product that is darker in color from my open tabs to the shopping cart",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Reef Men's Twinpin"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 22,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 83,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/adidas-originals-mens-geodiver-primeblue-athletic-and-training-shoes-orange.html |AND| __SHOPPING__/marc-joseph-new-york-mens-lightweight-fashion-slip-on-sockless-sneakers-non-slip-breathable-comfortable-walking-athletic-sports-shoes.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the product that {{attribute}} from my open tabs to the shopping cart",
|
|
"instantiation_dict": {
|
|
"attribute": "is brighter in color"
|
|
},
|
|
"intent": "Add the product that is brighter in color from my open tabs to the shopping cart",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"adidas Originals Mens Geodiver Primeblue Athletic and Training Shoes Orange"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 22,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 84,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/love-live-quote-art-wall-canvas-painting-dream-art-picture-black-white-print-and-poster-for-living-room-home-decor-70x100cm-3pcs-frameless.html |AND| __SHOPPING__/pittsburgh-pa-skyline-blue-by-michael-tompsett-16x24-inch-canvas-wall-art.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the product that {{attribute}} from my open tabs to the shopping cart",
|
|
"instantiation_dict": {
|
|
"attribute": "is most colorful"
|
|
},
|
|
"intent": "Add the product that is most colorful from my open tabs to the shopping cart",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Pittsburgh PA Skyline Blue"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 22,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 85,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/office-book-stand-tree-shaped-bookshelf-on-the-table-simple-student-shelf-bookcase-storage-shelf-organizer.html |AND| __SHOPPING__/home-bookshelf-bookcase-shelf-bookshelf-book-shelves-simple-student-desktop-small-picture-book-storage-household-simple-floor-living-room-children-s-bookcase-durable-bookcase-display-shelf-storage-org.html |AND| __SHOPPING__/lorell-6-shelf-panel-bookcase-36-x-12-x-72-mahogany.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add the product that {{attribute}} from my open tabs to the shopping cart",
|
|
"instantiation_dict": {
|
|
"attribute": "looks like an animal"
|
|
},
|
|
"intent": "Add the product that looks like an animal from my open tabs to the shopping cart",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Home Bookshelf Bookcase Shelf Bookshelf"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 22,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 86,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add all the items I need to make this to my shopping cart.",
|
|
"intent": "Add all the items I need to make this to my shopping cart.",
|
|
"image": "coco_images/000000024567.jpg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"hot dog",
|
|
"roll |OR| rolls |OR| bun"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 23,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 87,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add all the items I need to make this to my shopping cart.",
|
|
"intent": "Add all the items I need to make this to my shopping cart.",
|
|
"image": "coco_images/000000029675.jpg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"hot dog",
|
|
"roll |OR| rolls |OR| bun",
|
|
"mustard"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 23,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 88,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/men/clothing.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like {{item}}, but {{attribute}}, from this page to my wish list.",
|
|
"intent": "Add something like the shirt the person on the right is wearing, but in green, from this page to my wish list.",
|
|
"image": "coco_images/000000048396.jpg",
|
|
"instantiation_dict": {
|
|
"item": "the shirt the person on the right is wearing",
|
|
"attribute": "in green"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Men & Boy Long Sleeve Flannel Plaid Casual Shirts Button Down Regular Fit Long Sleeve Cotton Polo Shirt L-5XL"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 24,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 89,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like the {{item}} to my shopping cart.",
|
|
"intent": "Add something like the thing at the top of this image to my shopping cart.",
|
|
"image": "coco_images/000000064574.jpg",
|
|
"instantiation_dict": {
|
|
"item": "thing at the top of this image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"hair brush"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 25,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 90,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like the {{item}} to my shopping cart.",
|
|
"intent": "Add something like the colorful thing in the sky to my shopping cart.",
|
|
"image": "coco_images/000000433515.jpg",
|
|
"instantiation_dict": {
|
|
"item": "colorful thing in the sky"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There are no kites available on OneStopMarket.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 25,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 91,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like the {{item}} to my shopping cart.",
|
|
"intent": "Add something like the thing the person is carrying (in the same color) to my shopping cart.",
|
|
"image": "coco_images/000000329041.jpg",
|
|
"instantiation_dict": {
|
|
"item": "thing the person is carrying (in the same color)"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There are no red purses available on OneStopMarket.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 25,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 92,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like the {{item}} to my shopping cart.",
|
|
"intent": "Add something like the blue one to my shopping cart.",
|
|
"image": "coco_images/000000440507.jpg",
|
|
"instantiation_dict": {
|
|
"item": "blue one"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There is no luggage available on OneStopMarket.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 25,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 93,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like the {{item}} to my shopping cart.",
|
|
"intent": "Add something like the one in the bottom right to my shopping cart.",
|
|
"image": "coco_images/000000324715.jpg",
|
|
"instantiation_dict": {
|
|
"item": "one in the bottom right"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"scissors"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 25,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 94,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/men/clothing.html?p=2",
|
|
"geolocation": null,
|
|
"intent_template": "I like {{attribute}}. Can you add something like that {{condition}} to my wishlist, if there's one?",
|
|
"intent": "I like what the person on the left is wearing. Can you add something like that from this page to my wishlist, if there's one?",
|
|
"image": "coco_images/000000066771.jpg",
|
|
"instantiation_dict": {
|
|
"attribute": "what the person on the left is wearing",
|
|
"condition": "from this page"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"IZOD Men's Advantage Performance Full Zip Fleece Jacket"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 26,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 95,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?q=necktie&product_list_limit=36",
|
|
"geolocation": null,
|
|
"intent_template": "I like {{attribute}}. Can you add something like that {{condition}} to my wishlist, if there's one?",
|
|
"intent": "I like this person's outfit. Can you add something like that from this page in the same colors to my wishlist, if there's one?",
|
|
"image": "coco_images/000000163682.jpg",
|
|
"instantiation_dict": {
|
|
"attribute": "this person's outfit",
|
|
"condition": "from this page in the same colors"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Barry.Wang Men's Ties Set Silk Wedding Neckties Woven Silk Formal Business Casual(4/6/8PCS) |OR| Dress Shirts for Men Slim Fit, Classic Long Sleeve Solid Button Down Business Dress Shirt Wedding Party Top"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 26,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 96,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "I need something like this for my apartment. Can you add one to my wishlist?",
|
|
"intent": "I need something like this for my apartment. Can you add one to my wishlist?",
|
|
"image": "coco_images/000000167240.jpg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"vase"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 27,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 97,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "I need something like this for my apartment. Can you add one to my wishlist?",
|
|
"intent": "I need something like this for my apartment. Can you add one to my wishlist?",
|
|
"image": "coco_images/000000176232.jpg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"vase |OR| flower"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 27,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 98,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "I need something like this for my apartment. Can you add one to my wishlist?",
|
|
"intent": "I need something like this for my apartment. Can you add one to my wishlist?",
|
|
"image": "coco_images/000000167353.jpg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"clock"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 27,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 99,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/office-products/office-furniture-lighting/chairs-sofas.html?product_list_limit=36",
|
|
"geolocation": null,
|
|
"intent_template": "I really like the {{item}}, but I'm not a fan of the color. Can you see if there's one in {{attribute}} on this page, and if so, add the cheapest one to my wishlist?",
|
|
"intent": "I really like the purple item, but I'm not a fan of the color. Can you see if there's one in brown on this page, and if so, add the cheapest one to my wishlist?",
|
|
"image": "coco_images/000000172595.jpg",
|
|
"instantiation_dict": {
|
|
"item": "purple item",
|
|
"attribute": "brown"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Big and Tall Office Chair Executive Chair Wide Seat High Back Ergonomic Computer Chair Home Office Desk Chair Heavy Duty PU Leather Task Chair with Lumbar Support Arms, Brown"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 28,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 100,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "{{description}}, can you add one to my wishlist?",
|
|
"intent": "I like the shirt this person is wearing, can you add one to my wishlist?",
|
|
"image": "coco_images/000000173008.jpg",
|
|
"instantiation_dict": {
|
|
"description": "I like the shirt this person is wearing"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"hawaiian"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 29,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 101,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "{{description}}, can you add one to my wishlist?",
|
|
"intent": "I'd like to hang this on my christmas tree too, can you add one to my wishlist?",
|
|
"image": "coco_images/000000175443.jpg",
|
|
"instantiation_dict": {
|
|
"description": "I'd like to hang this on my christmas tree too"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"teddy"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 29,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 102,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "{{description}}, can you add one to my wishlist?",
|
|
"intent": "I need one of what it's wearing for the winter, can you add one to my wishlist?",
|
|
"image": "coco_images/000000286708.jpg",
|
|
"instantiation_dict": {
|
|
"description": "I need one of what it's wearing for the winter"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"beanie"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 29,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 103,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "{{description}}, can you add one to my wishlist?",
|
|
"intent": "This looks fun and I'd like to buy this system too, can you add one to my wishlist?",
|
|
"image": "coco_images/000000324258.jpg",
|
|
"instantiation_dict": {
|
|
"description": "This looks fun and I'd like to buy this system too"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"wii"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 29,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 104,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?p=2&q=dress",
|
|
"geolocation": null,
|
|
"intent_template": "{{description}}, can you add the most similar one on this page to my wishlist?",
|
|
"intent": "I love the color and style of this, can you add the most similar one on this page to my wishlist?",
|
|
"image": "coco_images/000000327601.jpg",
|
|
"instantiation_dict": {
|
|
"description": "I love the color and style of this"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"ANTS Women's Simple Short Bridesmaid Dress Chiffon Homecoming Dresses"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 30,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 105,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/men/shoes.html?product_list_limit=36",
|
|
"geolocation": null,
|
|
"intent_template": "{{description}}, can you add the most similar one on this page to my wishlist?",
|
|
"intent": "The material of this looks quite good, can you add the most similar one on this page to my wishlist?",
|
|
"image": "coco_images/000000399655.jpg",
|
|
"instantiation_dict": {
|
|
"description": "The material of this looks quite good"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Cole Haan Men's Lionel Dress Chukka Boot |OR| MBT Men's Kabisa Laceup Shoe |OR| Donald J Pliner Men's Loafer, Black, 10"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 30,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 106,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/wall-art/posters-prints.html",
|
|
"geolocation": null,
|
|
"intent_template": "{{description}}, can you add the most similar one on this page to my wishlist?",
|
|
"intent": "I like this painting, can you add the most similar one on this page to my wishlist?",
|
|
"image": "coco_images/000000415238.jpg",
|
|
"instantiation_dict": {
|
|
"description": "I like this painting"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Wieco Art Sunflower by Vincent Van Gogh Oil Paintings Reproduction Modern Floral Giclee Canvas Prints Artwork Flowers Pictures on Canvas Wall Art for Home and Office Decorations |OR| African American Canvas Wall Art Black Woman With Butterflies Paintings Sexy Black arounded by Sunflower Canvas Paintings Afro Women Picture Black Queen Inspirational Wall Art Hanging Poster Painting Black Girl Photography Abstract Watercolor Sunflower Pa"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 30,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 107,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "I need something to store {{item}}. Add one to my shopping cart.",
|
|
"intent": "I need something to store the item on the right. Add one to my shopping cart.",
|
|
"image": "coco_images/000000444275.jpg",
|
|
"instantiation_dict": {
|
|
"item": "the item on the right"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"microwave",
|
|
"storage |OR| shelf |OR| rack"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 31,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "__SHOPPING__/xxjf-microwave-rack-stainless-steel-2-tier-microwave-oven-rack-kitchen-storage-organiser-cabinet-printer-shelf-bakers-rack.html",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 108,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like {{attribute}} to my wish list.",
|
|
"intent": "Add something like what the man is wearing to my wish list.",
|
|
"image": "coco_images/000000024567.jpg",
|
|
"instantiation_dict": {
|
|
"attribute": "what the man is wearing"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"page_image_query"
|
|
],
|
|
"page_image_query": [
|
|
{
|
|
"eval_image_url": "__SHOPPING__/wishlist/",
|
|
"eval_image_class": ".products-grid .wishlist .product-image-photo",
|
|
"eval_vqa": [
|
|
{
|
|
"question": "Is this a polo shirt? (yes/no)",
|
|
"answer": "yes"
|
|
},
|
|
{
|
|
"question": "Is this shirt green? (yes/no)",
|
|
"answer": "yes"
|
|
}
|
|
]
|
|
}
|
|
],
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": ""
|
|
},
|
|
"intent_template_id": 32,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 109,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add {{items}} to the comparison page?",
|
|
"intent": "Can you add these items to the comparison page?",
|
|
"image": "coco_images/000000348012.jpg",
|
|
"instantiation_dict": {
|
|
"items": "these items"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/catalog/product_compare",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"scissors",
|
|
"tape"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 33,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 110,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add this exact product to my shopping cart. I think it is in the \"{{category}}\" category.",
|
|
"intent": "Add this exact product to my shopping cart. I think it is in the \"Smartwatch Accessories\" category.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B09CGLFYKT.0.jpg",
|
|
"instantiation_dict": {
|
|
"category": "Smartwatch Accessories"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Fullmosa Compatible with Apple Watch Band 44mm with Bumper Case, Rugged iWatch Band with Screen Protector Only for Apple Watch Series 6/5/4/SE, Orange"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 34,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 111,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add this exact product to my shopping cart. I think it is in the \"{{category}}\" category.",
|
|
"intent": "Add this exact product to my shopping cart. I think it is in the \"Herbs, Spices & Seasonings\" category.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B00LSYQ87G.0.jpg",
|
|
"instantiation_dict": {
|
|
"category": "Herbs, Spices & Seasonings"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Lawry's Chipotle Cinnamon Rub, 27 oz - One 27 Ounce Container of Chipotle Cinnamon Rub Made of Chipotle Chili Pepper, Cinnamon, and Paprika Perfect for Burgers, Pork, Chicken, and Vegetables"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 34,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 112,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add this exact product to my shopping cart. I think it is in the \"{{category}}\" category.",
|
|
"intent": "Add this exact product to my shopping cart. I think it is in the \"Dining & Entertaining\" category.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B01M0HT1AW.0.jpg",
|
|
"instantiation_dict": {
|
|
"category": "Dining & Entertaining"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Reston Lloyd Plastic Tumbler Corelle Coordinates, Timber Shadows, 8oz Acrylic Drinkware, Set of 6, Juice, Clear"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 34,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 113,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add this exact product to my shopping cart. I think it is in the \"{{category}}\" category.",
|
|
"intent": "Add this exact product to my shopping cart. I think it is in the \"Women Accessories\" category.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B093YS65BV.0.jpg",
|
|
"instantiation_dict": {
|
|
"category": "Women Accessories"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Set of 2 Mesh Laundry Bags Cute Orange Cat-1 Medium & 1 Small Bags Laundry,Blouse, Hosiery, Stocking, Underwear, Bra Lingerie, Travel Laundry Bag(8rp9k)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 34,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image, need to paginate to second page",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 114,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add this exact product to my shopping cart. I think it is in the \"{{category}}\" category.",
|
|
"intent": "Add this exact product to my shopping cart. I think it is in the \"Makeup\" category.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B08GHD7MWP.0.jpg",
|
|
"instantiation_dict": {
|
|
"category": "Makeup"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Petansy 3 Packs Aloe Vera Lipstick , Lips Moisturizer Long Lasting Nutritious Lip Balm Magic Temperature Color Change Lip Gloss-Set(A)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 34,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 115,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add this exact product to my shopping cart. I think it is in the \"{{category}}\" category.",
|
|
"intent": "Add this exact product to my shopping cart. I think it is in the \"Patio Furniture & Accessories\" category.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B07CZHLNS2.0.jpg",
|
|
"instantiation_dict": {
|
|
"category": "Patio Furniture & Accessories"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Modway EEI-2923-GRY-GRY Aura Outdoor Patio Wicker Rattan Sofa Gray"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 34,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image, need to paginate to second page",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 116,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add this exact product to my wish list. I think it might be in the \"{{category}}\" category but I'm not certain.",
|
|
"intent": "Add this exact product to my wish list. I think it might be in the \"PlayStation 4\" category but I'm not certain.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B075LFHQCV.0.jpg",
|
|
"instantiation_dict": {
|
|
"category": "PlayStation 4"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Nintendo Switch Pro Controller Xenoblade 2 Edition (Japan Import)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 35,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image, product is actually in the Nintendo Switch category",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 117,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add this exact product to my wish list. I think it might be in the \"{{category}}\" category but I'm not certain.",
|
|
"intent": "Add this exact product to my wish list. I think it might be in the \"Office Furniture & Lighting > Chairs & Sofas\" category but I'm not certain.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B00QGY0PQS.0.jpg",
|
|
"instantiation_dict": {
|
|
"category": "Office Furniture & Lighting > Chairs & Sofas"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Flash Furniture Low Back Designer Armless White Ribbed Swivel Task Office Chair"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 35,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image, product is actually in the Home > Home & Kitchen > Furniture > Home Office Furniture category",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 118,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add this exact product to my wish list. I think it might be in the \"{{category}}\" category but I'm not certain.",
|
|
"intent": "Add this exact product to my wish list. I think it might be in the \"Men > Clothing\" category but I'm not certain.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B096YB95CB.0.jpg",
|
|
"instantiation_dict": {
|
|
"category": "Men > Clothing"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"INTIMO Elf The Movie Men's Cotton Headed Ninny Muggins Allover Holiday Christmas Film Loungewear Pajama Pants"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 35,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image, product is actually in the Novelty & More category",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 119,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add this exact product to my wish list. I think it might be in the \"{{category}}\" category but I'm not certain.",
|
|
"intent": "Add this exact product to my wish list. I think it might be in the \"Home D\u00e9cor Products\" category but I'm not certain.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B08LD6T579.0.jpg",
|
|
"instantiation_dict": {
|
|
"category": "Home D\u00e9cor Products"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"ELUZE 4-Light Bathroom Vanity Light Black Vintage Bathroom Lighting with Clear Glass Shades Wall Sconce Lighting Fixtures for Bathroom Kitchen Hallway"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 35,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image, product is actually in the Lighting & Ceiling Fans category",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 120,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add this exact product to my wish list. I think it might be in the \"{{category}}\" category but I'm not certain.",
|
|
"intent": "Add this exact product to my wish list. I think it might be in the \"Home D\u00e9cor Products\" category but I'm not certain.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B08Y7N7Z7V.0.jpg",
|
|
"instantiation_dict": {
|
|
"category": "Home D\u00e9cor Products"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Dutsekk LED Bathroom Mirror Anti-Fog - 36x28 Inch Dimmable IP44 Waterproof Bathroom Mirror with Lights - Lighted Bathroom Vanity Mirror for Wall with CCT Adjustable for Makeup"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 35,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image, product is actually in the Bathroom Accessories category",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 121,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me how much this exact item costs on OneStopMarket.",
|
|
"intent": "Tell me how much this exact item costs on OneStopMarket.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B06XKJNJJZ.0.jpg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"501.25"
|
|
]
|
|
},
|
|
"reference_url": "__SHOPPING__/sandisk-extreme-pro-512-gb-cfast-card-model-sdcfsp-512g-a46d.html",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$501.25"
|
|
},
|
|
"intent_template_id": 36,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "need to process exact image",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 122,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me how much this exact item costs on OneStopMarket.",
|
|
"intent": "Tell me how much this exact item costs on OneStopMarket.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B07TZD4H27.0.jpg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"126.65"
|
|
]
|
|
},
|
|
"reference_url": "__SHOPPING__/martha-stewart-herbal-botany-wall-art-living-room-decor-floral-linen-canvas-home-accent-country-lifestyle-bathroom-decoration-ready-to-hang-poster-painting-for-bedroom-17-84-x-21-84-green.html",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$126.65"
|
|
},
|
|
"intent_template_id": 36,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "need to process exact image",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 123,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me how much this exact item costs on OneStopMarket.",
|
|
"intent": "Tell me how much this exact item costs on OneStopMarket.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B08TC17K6D.0.jpg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"328.77"
|
|
]
|
|
},
|
|
"reference_url": "__SHOPPING__/skyinbags-hand-painted-abstract-plant-tree-oil-painting-on-canvas-large-picture-wall-artwork-modern-art-poster-decoration-for-corridor-live-room-home-decor-gift-90x130cm-unframed9.html",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$328.77"
|
|
},
|
|
"intent_template_id": 36,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "need to process exact image",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 124,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me how much this exact item costs on OneStopMarket.",
|
|
"intent": "Tell me how much this exact item costs on OneStopMarket.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B002IVVD4G.0.jpg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"645.00"
|
|
]
|
|
},
|
|
"reference_url": "__SHOPPING__/nec-np4100-6200-lumen-xga-dlp-projector.html",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$645.00"
|
|
},
|
|
"intent_template_id": 36,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "need to process exact image",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 125,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me how much this exact item costs on OneStopMarket.",
|
|
"intent": "Tell me how much this exact item costs on OneStopMarket.",
|
|
"image": "https://images.pexels.com/photos/1152077/pexels-photo-1152077.jpeg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "This exact item is not available on OneStopMarket.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 36,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 126,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me how much this exact item costs on OneStopMarket.",
|
|
"intent": "Tell me how much this exact item costs on OneStopMarket.",
|
|
"image": "https://images.pexels.com/photos/904620/pexels-photo-904620.jpeg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "This exact item does is not available on OneStopMarket.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 36,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to process exact image",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 127,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/men/clothing.html",
|
|
"geolocation": null,
|
|
"intent_template": "I'm interested in the {{item}}. Can you return an image link showing {{image_desc}}?",
|
|
"intent": "I'm interested in the ugly christmas sweater. Can you return an image link showing how it looks like from the back?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "ugly christmas sweater",
|
|
"image_desc": "how it looks like from the back"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B00NIN2O28.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B00NIN2O28.1.jpg"
|
|
},
|
|
"intent_template_id": 37,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"comments": "hard: need to process image, look at images on the product page",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 128,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/women/clothing.html",
|
|
"geolocation": null,
|
|
"intent_template": "I'm interested in the {{item}}. Can you return an image link showing {{image_desc}}?",
|
|
"intent": "I'm interested in the nightmare before christmas sweatshirt. Can you return an image link showing how it looks like from the back?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "nightmare before christmas sweatshirt",
|
|
"image_desc": "how it looks like from the back"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "Such an image does not exist on the page.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 37,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"comments": "hard: need to process image, look at images on the product page",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 129,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/cell-phones-accessories/cases-holsters-sleeves/flip-cases.html",
|
|
"geolocation": null,
|
|
"intent_template": "I'm interested in the {{item}}. Can you return an image link showing {{image_desc}}?",
|
|
"intent": "I'm interested in the pink case. Can you return an image link showing how it looks like from the back?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "pink case",
|
|
"image_desc": "how it looks like from the back"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "Such an image does not exist on the page.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 37,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"comments": "hard: need to process image, look at images on the product page",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 130,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/women/clothing.html?p=3",
|
|
"geolocation": null,
|
|
"intent_template": "I'm interested in the {{item}}. Can you return an image link showing {{image_desc}}?",
|
|
"intent": "I'm interested in the pink hoodie. Can you return an image link showing how it looks like from the back?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "pink hoodie",
|
|
"image_desc": "how it looks like from the back"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B073ZB2V56.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B073ZB2V56.1.jpg"
|
|
},
|
|
"intent_template_id": 37,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 131,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/furniture/living-room-furniture.html",
|
|
"geolocation": null,
|
|
"intent_template": "I'm interested in the {{item}}. Can you return an image link showing {{image_desc}}?",
|
|
"intent": "I'm interested in the coffee table in the first row. Can you return an image link showing how the material looks like close up?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "coffee table in the first row",
|
|
"image_desc": "how the material looks like close up"
|
|
},
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B09KX1J3KW.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B09KX1J3KW.1.jpg"
|
|
},
|
|
"intent_template_id": 37,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 132,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/patio-lawn-garden/patio-furniture-accessories.html?p=2",
|
|
"geolocation": null,
|
|
"intent_template": "I'm interested in the {{item}}. Can you return an image link showing {{image_desc}}?",
|
|
"intent": "I'm interested in the colorful item in the first row. Can you return an image link showing how it might look if I put my feet up on it?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "colorful item in the first row",
|
|
"image_desc": "how it might look if I put my feet up on it"
|
|
},
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B07Q7PLPKN.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07Q7PLPKN.1.jpg"
|
|
},
|
|
"intent_template_id": 37,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 133,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/exercise-fitness.html",
|
|
"geolocation": null,
|
|
"intent_template": "I'm interested in the {{item}}. Can you return an image link showing {{image_desc}}?",
|
|
"intent": "I'm interested in the colorful item in the first row. Can you return an image link showing how it might look when worn?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "colorful item in the first row",
|
|
"image_desc": "how it might look when worn"
|
|
},
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B09PF55P17.0.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B09PF55P17.0.jpg"
|
|
},
|
|
"intent_template_id": 37,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 134,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/sports.html",
|
|
"geolocation": null,
|
|
"intent_template": "I'm interested in the {{item}}. Can you return an image link showing {{image_desc}}?",
|
|
"intent": "I'm interested in the boots in the first row. Can you return an image link showing how it might look when worn?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "boots in the first row",
|
|
"image_desc": "how it might look when worn"
|
|
},
|
|
"require_reset": false,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B09P1CJTD9.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B09P1CJTD9.1.jpg"
|
|
},
|
|
"intent_template_id": 37,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 135,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/schlumbergera-hybrid-zygocactus-christmas-cactus-plant-3-5-inch-pot-1-plant.html",
|
|
"geolocation": null,
|
|
"intent_template": "Return an image link of an image showing how this item looks like {{attribute}}.",
|
|
"intent": "Return an image link of an image showing how this item looks like when it is flowering.",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"attribute": "when it is flowering"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B07W88SQCT.0.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07W88SQCT.0.jpg"
|
|
},
|
|
"intent_template_id": 38,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 136,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/ambesonne-japanese-duvet-cover-set-japanese-traditional-garden-design-wildlife-forest-meditation-origami-decorative-3-piece-bedding-set-with-2-pillow-shams-queen-size-black-and-white.html",
|
|
"geolocation": null,
|
|
"intent_template": "Return an image link of an image showing how this item looks like {{attribute}}.",
|
|
"intent": "Return an image link of an image showing how this item looks like from above.",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"attribute": "from above"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B073Q36J45.0.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B073Q36J45.0.jpg"
|
|
},
|
|
"intent_template_id": 38,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 137,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Return an image link of {{item}}.",
|
|
"intent": "Return an image link of the cheapest Canon printer from the \"Printers & Accessories\" category which shows it printing something.",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "the cheapest Canon printer from the \"Printers & Accessories\" category which shows it printing something"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B005TI2Q6O.0.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B005TI2Q6O.0.jpg"
|
|
},
|
|
"intent_template_id": 39,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 138,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/patio-lawn-garden/gardening-lawn-care/plants-seeds-bulbs.html",
|
|
"geolocation": null,
|
|
"intent_template": "Return an image link of {{item}}.",
|
|
"intent": "Return an image link of the most highly reviewed item on this page.",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "the most highly reviewed item on this page"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B07SSFGC5S.0.jpg |OR| B07SSFGC5S.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07SSFGC5S.0.jpg"
|
|
},
|
|
"intent_template_id": 39,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 139,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breads-bakery/cookies.html",
|
|
"geolocation": null,
|
|
"intent_template": "Return an image link from one of the products here showing {{item}}.",
|
|
"intent": "Return an image link from one of the products here showing a close up of some cookies, if it exists.",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "a close up of some cookies, if it exists"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B08FP4B8N9.1.jpg |OR| B07GD7RHMV.1.jpg |OR| B0719MJ5H7.0.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B08FP4B8N9.1.jpg"
|
|
},
|
|
"intent_template_id": 40,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 140,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/oral-care/toothbrushes-accessories.html",
|
|
"geolocation": null,
|
|
"intent_template": "Return an image link from one of the products here showing {{item}}.",
|
|
"intent": "Return an image link from one of the products here showing a single blue toothbrush, if it exists.",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "a single blue toothbrush, if it exists"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B086LJX6TL.1.jpg |OR| B009OCJBN2.0.jpg |OR| B009OCJBN2.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B086LJX6TL.1.jpg"
|
|
},
|
|
"intent_template_id": 40,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 141,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/oral-care/toothbrushes-accessories.html",
|
|
"geolocation": null,
|
|
"intent_template": "The panda toothbrush box is cute, can you return an image link showing the design with other animals if possible?",
|
|
"intent": "The panda toothbrush box is cute, can you return an image link showing the design with other animals if possible?",
|
|
"image": null,
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B09BCV4NS1.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B09BCV4NS1.1.jpg"
|
|
},
|
|
"intent_template_id": 41,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 142,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/xbox-one.html",
|
|
"geolocation": null,
|
|
"intent_template": "I'm interested in the {{item}}. Can you return an image link showing {{image_desc}}?",
|
|
"intent": "I'm interested in the cheaper pink controller. Can you return an image link showing how it looks like from another angle?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "cheaper pink controller",
|
|
"image_desc": "how it looks like from another angle"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B07Q4R3X1B.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07Q4R3X1B.1.jpg or __SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B074W9FQC2.1.jpg"
|
|
},
|
|
"intent_template_id": 37,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 143,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/skin-care/face.html",
|
|
"geolocation": null,
|
|
"intent_template": "I'd like to share the {{item}} with my friend, can you return an image link {{description}}?",
|
|
"intent": "I'd like to share the third item with my friend, can you return an image link of an image summarizing its benefits?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "third item",
|
|
"description": "of an image summarizing its benefits"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B07YZTN7TX.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07YZTN7TX.1.jpg"
|
|
},
|
|
"intent_template_id": 42,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"comments": "need to do OCR",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 144,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/furniture/living-room-furniture.html",
|
|
"geolocation": null,
|
|
"intent_template": "I'd like to share the {{item}} with my friend, can you return an image link {{description}}?",
|
|
"intent": "I'd like to share the second item with my friend, can you return an image link without the TV (just the stand)?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"item": "second item",
|
|
"description": "without the TV (just the stand)"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B07MG5G5B5.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07MG5G5B5.1.jpg"
|
|
},
|
|
"intent_template_id": 42,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 145,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/outdoor-patio-folding-side-table-square-metal-end-table-portable-small-bistro-coffee-table-green.html",
|
|
"geolocation": null,
|
|
"intent_template": "Can you return the link of an image {{description}}?",
|
|
"intent": "Can you return the link of an image highlighting the features of this table?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"description": "highlighting the features of this table"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B07FM3WKJ8.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07FM3WKJ8.1.jpg"
|
|
},
|
|
"intent_template_id": 43,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 146,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/milwaukee-pretzel-company-authentic-bavarian-style-gourmet-soft-pretzel-fresh-baked-and-shipped-16-oz-1-lb-bavarian-beast-pretzel-pack-of-2.html",
|
|
"geolocation": null,
|
|
"intent_template": "Can you return the link of an image {{description}}?",
|
|
"intent": "Can you return the link of an image illustrating the dimensions of the pretzel?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"description": "illustrating the dimensions of the pretzel"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B079B43M9T.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B079B43M9T.1.jpg"
|
|
},
|
|
"intent_template_id": 43,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 147,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/crestlive-products-dresser-storage-drawer-organizer-fabric-dresser-for-bedroom-living-room-entryway-closets-easy-pull-fabric-bins-wood-top-mixed-color.html",
|
|
"geolocation": null,
|
|
"intent_template": "Can you return the link of an image {{description}}?",
|
|
"intent": "Can you return the link of an image illustrating the dimensions of the dresser?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"description": "illustrating the dimensions of the dresser"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "Such an image does not exist on the page.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 43,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 148,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/dave-s-killer-bread-good-seed-4-loaves-usda-organic.html",
|
|
"geolocation": null,
|
|
"intent_template": "Can you return the link of an image {{description}}?",
|
|
"intent": "Can you return the link of an image showing a close up of the bread (without the packaging)?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"description": "showing a close up of the bread (without the packaging)"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "Such an image does not exist on the page.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 43,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 149,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/dave-s-killer-bread-good-seed-4-loaves-usda-organic.html",
|
|
"geolocation": null,
|
|
"intent_template": "Can you return the link of an image {{description}}?",
|
|
"intent": "Can you return the link of an image showing the nutritional information of this?",
|
|
"image": null,
|
|
"instantiation_dict": {
|
|
"description": "showing the nutritional information of this"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B00U10YS7K.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B00U10YS7K.1.jpg"
|
|
},
|
|
"intent_template_id": 43,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 150,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I remembered that I ordered something like this, can you show me the corresponding order page?",
|
|
"intent": "I remembered that I ordered something like this, can you show me the corresponding order page?",
|
|
"image": "https://images.pexels.com/photos/12021852/pexels-photo-12021852.jpeg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/sales/order/view/order_id/161/",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 44,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "hard",
|
|
"comments": "pg1. __SHOPPING__/wangliwer-mini-wireless-bluetooth-speaker-with-mic-tf-card-metal-portable-subwoof-sound-fm-radio-aux-mp3-music-plays-loudspeaker-portable-speaker-color-pink.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 151,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I remembered that I ordered something like this, can you show me the corresponding order page?",
|
|
"intent": "I remembered that I ordered something like this, can you show me the corresponding order page?",
|
|
"image": "https://images.pexels.com/photos/932638/pexels-photo-932638.jpeg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/sales/order/view/order_id/157/",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 44,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "hard",
|
|
"comments": "pg1. __SHOPPING__/photo-backgrounds-blue-sea-background-for-shiny-underwater-photography-pea-bulb-scenic-party-decor-photo-decorations-photocall-photo-studio-5x3ft.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 152,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I remembered that I ordered something like this, can you show me the corresponding order page?",
|
|
"intent": "I remembered that I ordered something like this, can you show me the corresponding order page?",
|
|
"image": "https://images.pexels.com/photos/18541045/pexels-photo-18541045/free-photo-of-standing-giraffes-in-glass-lens-filter.jpeg",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/sales/order/view/order_id/165/",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 44,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": "pg3. __SHOPPING__/37mm-cpl-polarizing-lens-filter-portable-polarizer-camera-lens-mobile-phone-clip-designed-polarizer-lens-filter-improve-color-saturation-and-contrast-for-eliminating-or-reducing-light-spots.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 153,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} of the same brand as the product in this picture.",
|
|
"intent": "Find me a game console of the same brand as the product in this picture.",
|
|
"image": "https://images.pexels.com/photos/5626726/pexels-photo-5626726.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"instantiation_dict": {
|
|
"category": "a game console"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html",
|
|
"page_image_query"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_product_attributes(__page__, 'manufacturer |OR| brand name')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Microsoft"
|
|
]
|
|
}
|
|
}
|
|
],
|
|
"page_image_query": [
|
|
{
|
|
"eval_image_url": "last",
|
|
"eval_image_class": ".fotorama__stage__frame",
|
|
"eval_vqa": [
|
|
{
|
|
"question": "Is this a game console? (yes/no)",
|
|
"answer": "yes"
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 45,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/microsoft-xbox-one-console-with-accessories-1tb-hdd-black.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 154,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} of the same brand as the product in this picture.",
|
|
"intent": "Find me a set of headphones of the same brand as the product in this picture.",
|
|
"image": "https://images.pexels.com/photos/45889/camera-photo-camera-sony-alpha-7-sony-45889.jpeg",
|
|
"instantiation_dict": {
|
|
"category": "a set of headphones"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html",
|
|
"page_image_query"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_product_attributes(__page__, 'manufacturer |OR| brand name')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Sony"
|
|
]
|
|
}
|
|
}
|
|
],
|
|
"page_image_query": [
|
|
{
|
|
"eval_image_url": "last",
|
|
"eval_image_class": ".fotorama__stage__frame",
|
|
"eval_vqa": [
|
|
{
|
|
"question": "Is this a headphone? (yes/no)",
|
|
"answer": "yes"
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 45,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 155,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} of the same brand as the product in this picture. It needs to {{description}}.",
|
|
"intent": "Find me a set of headphones of the same brand as the product in this picture. It needs to be silver colored and have at least 10 reviews with an average rating greater than 4.",
|
|
"image": "https://images.pexels.com/photos/1528851/pexels-photo-1528851.jpeg",
|
|
"instantiation_dict": {
|
|
"category": "a set of headphones",
|
|
"description": "be silver colored and have at least 10 reviews with an average rating greater than 4"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/sony-wh1000xm3-bluetooth-wireless-noise-canceling-headphones-silver-wh-1000xm3-s-renewed.html |OR| __SHOPPING__/sony-h900n-hi-res-noise-cancelling-wireless-headphone-grayish-black-renewed.html |OR| __SHOPPING__/sony-mdrx10-red-simon-cowell-x-headphones-with-50mm-diaphragms.html",
|
|
"program_html": [],
|
|
"url_note": "GOLD in PRED"
|
|
},
|
|
"intent_template_id": 46,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 156,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} of the same brand as the product in this picture. It needs to {{description}}.",
|
|
"intent": "Find me a printer of the same brand as the product in this picture. It needs to be white and have at least 11 reviews with an average rating greater than 4.",
|
|
"image": "https://images.pexels.com/photos/7639358/pexels-photo-7639358.jpeg",
|
|
"instantiation_dict": {
|
|
"category": "a printer",
|
|
"description": "be white and have at least 11 reviews with an average rating greater than 4"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/hp-deskjet-f380-all-in-one-printer-scanner-copier.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 46,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 157,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} of the same brand as the product in this picture. It needs to {{description}}.",
|
|
"intent": "Find me protein bars of the same brand as the product in this picture. It needs to have price between $30 and $50.",
|
|
"image": "https://images.pexels.com/photos/12709747/pexels-photo-12709747.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"instantiation_dict": {
|
|
"category": "protein bars",
|
|
"description": "have price between $30 and $50"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/kellogg-s-special-k-protein-bars-meal-replacement-protein-snacks-value-size-chocolatey-chip-cookie-dough-19oz-box-12-bars.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 46,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 158,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that is of the same brand as products in one of the following pictures. It needs to {{description}}.",
|
|
"intent": "Find me a digital camera that is of the same brand as products in one of the following pictures. It needs to be black and have at least 12 reviews. Furthermore, it cannot be too expensive - it needs to have price less than $700.",
|
|
"image": [
|
|
"https://images.pexels.com/photos/1022187/pexels-photo-1022187.jpeg",
|
|
"https://images.pexels.com/photos/89551/pexels-photo-89551.jpeg"
|
|
],
|
|
"instantiation_dict": {
|
|
"category": "a digital camera",
|
|
"description": "be black and have at least 12 reviews. Furthermore, it cannot be too expensive - it needs to have price less than $700"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html",
|
|
"page_image_query"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_num_reviews(__page__)",
|
|
"required_contents": {
|
|
"required_values": [
|
|
">= 12"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_product_price(__page__)",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"< 700"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_product_attributes(__page__, 'manufacturer |OR| brand name')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Olympus |OR| Nikon"
|
|
]
|
|
}
|
|
}
|
|
],
|
|
"page_image_query": [
|
|
{
|
|
"eval_image_url": "last",
|
|
"eval_image_class": ".fotorama__stage__frame",
|
|
"eval_vqa": [
|
|
{
|
|
"question": "Is this a digital camera? (yes/no)",
|
|
"answer": "yes"
|
|
},
|
|
{
|
|
"question": "Is the color of the product black? (yes/no)",
|
|
"answer": "yes"
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 47,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/olympus-om-d-e-m1-16mp-mirrorless-digital-camera-with-3-inch-lcd-body-only-silver-w-black-trim.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 159,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like {{attribute}} to my wish list.",
|
|
"intent": "Add something like what the person is covered with in a similar color to my wish list.",
|
|
"image": "https://images.pexels.com/photos/269141/pexels-photo-269141.jpeg",
|
|
"instantiation_dict": {
|
|
"attribute": "what the person is covered with in a similar color"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"page_image_query"
|
|
],
|
|
"page_image_query": [
|
|
{
|
|
"eval_image_url": "__SHOPPING__/wishlist/",
|
|
"eval_image_class": ".products-grid .wishlist .product-image-photo",
|
|
"eval_vqa": [
|
|
{
|
|
"question": "Is this a blanket? (yes/no)",
|
|
"answer": "yes"
|
|
},
|
|
{
|
|
"question": "Is this blanket light blue? (yes/no)",
|
|
"answer": "yes"
|
|
}
|
|
]
|
|
}
|
|
],
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": ""
|
|
},
|
|
"intent_template_id": 32,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"comments": "__SHOPPING__/wellber-extra-soft-fuzzy-faux-fur-throw-blanket-reversible-decorative-fluffy-sherpa-blanket-lightweight-cozy-microfiber-plush-furry-shaggy-fleece-blanket-for-couch-sofa-bed-50-x60-ice-blue.html",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 160,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like {{attribute}} to my wish list.",
|
|
"intent": "Add something like what the girl is holding to my wish list.",
|
|
"image": "https://images.pexels.com/photos/5614386/pexels-photo-5614386.jpeg",
|
|
"instantiation_dict": {
|
|
"attribute": "what the girl is holding"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"page_image_query"
|
|
],
|
|
"page_image_query": [
|
|
{
|
|
"eval_image_url": "__SHOPPING__/wishlist/",
|
|
"eval_image_class": ".products-grid .wishlist .product-image-photo",
|
|
"eval_vqa": [
|
|
{
|
|
"question": "Is this a cookie? (yes/no)",
|
|
"answer": "yes"
|
|
}
|
|
]
|
|
}
|
|
],
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": ""
|
|
},
|
|
"intent_template_id": 32,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 161,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/wall-art/posters-prints.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like {{item}}, but {{attribute}}, from this page to my wish list.",
|
|
"intent": "Add something like the picture shown, but in sketching style, from this page to my wish list.",
|
|
"image": "https://images.pexels.com/photos/1054672/pexels-photo-1054672.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "the picture shown",
|
|
"attribute": "in sketching style"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Yelash Cute Elephant Canvas Wall Art Colorful Dots and Sketch Elephant Picture Print for Kids Room Bathroom Poster Framed Ready to Hang (12\"x16\"x1 Panel)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 24,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "__SHOPPING__/yelash-cute-elephant-canvas-wall-art-colorful-dots-and-sketch-elephant-picture-print-for-kids-room-bathroom-poster-framed-ready-to-hang-12-x16-x1-panel.html",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 162,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/cell-phones-accessories/cases-holsters-sleeves/basic-cases.html?p=2",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like {{item}}, but {{attribute}}, from this page to my wish list.",
|
|
"intent": "Add something like what is used to protect the phone in the picture, but one with a ring kickstand, from this page to my wish list.",
|
|
"image": "https://images.pexels.com/photos/3392232/pexels-photo-3392232.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "what is used to protect the phone in the picture",
|
|
"attribute": "one with a ring kickstand"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"KSELF for iPhone 11 Case with [2 Pack] Tempered Glass Screen Protector, Hard PC Slim Cover with Ring Kickstand, Full Protective Shockproof Dual Layer Hybrid Bumper Case for iPhone 11 6.1 inch (Blue)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 24,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/kself-for-iphone-11-case-with-2-pack-tempered-glass-screen-protector-hard-pc-slim-cover-with-ring-kickstand-full-protective-shockproof-dual-layer-hybrid-bumper-case-for-iphone-11-6-1-inch-blue.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 163,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like {{attribute}} to my wish list.",
|
|
"intent": "Add something like this to my wish list.",
|
|
"image": "https://images.pexels.com/photos/837267/pexels-photo-837267.jpeg",
|
|
"instantiation_dict": {
|
|
"attribute": "this"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"page_image_query"
|
|
],
|
|
"page_image_query": [
|
|
{
|
|
"eval_image_url": "__SHOPPING__/wishlist/",
|
|
"eval_image_class": ".products-grid .wishlist .product-image-photo",
|
|
"eval_vqa": [
|
|
{
|
|
"question": "Is this a cactus? (yes/no)",
|
|
"answer": "yes"
|
|
},
|
|
{
|
|
"question": "Is this a potted plant? (yes/no)",
|
|
"answer": "yes"
|
|
}
|
|
]
|
|
}
|
|
],
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": ""
|
|
},
|
|
"intent_template_id": 32,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "__SHOPPING__/artificial-cactus-fake-cactus-16-faux-cacti-plants-for-home-garden-office-store-decoration.html",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 164,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that is of the same brand as products in one of the following pictures. It needs to {{description}}.",
|
|
"intent": "Find me a television that is of the same brand as products in one of the following pictures. It needs to have price at least $600.",
|
|
"image": [
|
|
"https://images.pexels.com/photos/1447254/pexels-photo-1447254.jpeg",
|
|
"https://images.pexels.com/photos/3066/smartphone-mockup-mobile-phone-screen.jpg"
|
|
],
|
|
"instantiation_dict": {
|
|
"category": "a television",
|
|
"description": "have price at least $600"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html",
|
|
"page_image_query"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_product_price(__page__)",
|
|
"required_contents": {
|
|
"required_values": [
|
|
">= 600"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_product_attributes(__page__, 'brand name |OR| manufacturer')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"LG |OR| SAMSUNG"
|
|
]
|
|
}
|
|
}
|
|
],
|
|
"page_image_query": [
|
|
{
|
|
"eval_image_url": "last",
|
|
"eval_image_class": ".fotorama__stage__frame",
|
|
"eval_vqa": [
|
|
{
|
|
"question": "Is this a television? (yes/no)",
|
|
"answer": "yes"
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 47,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/lg-50nano80upa-50-nanocell-4k-nano80-series-smart-ultra-hd-tv-with-an-lg-sn6y-3-1-channel-dts-virtual-high-resolution-soundbar-and-subwoofer-2021.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 165,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that is of the same brand as products in one of the following pictures. It needs to {{description}}.",
|
|
"intent": "Find me a men's tennis shoe that is of the same brand as products in one of the following pictures. It needs to have price between $60 and $120 with at least 11 reviews.",
|
|
"image": [
|
|
"https://images.pexels.com/photos/1383775/pexels-photo-1383775.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"https://images.pexels.com/photos/6748322/pexels-photo-6748322.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1"
|
|
],
|
|
"instantiation_dict": {
|
|
"category": "a men's tennis shoe",
|
|
"description": "have price between $60 and $120 with at least 11 reviews"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_product_price(__page__)",
|
|
"required_contents": {
|
|
"required_values": [
|
|
">= 60",
|
|
"<= 120"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_num_reviews(__page__)",
|
|
"required_contents": {
|
|
"required_values": [
|
|
">= 11"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_product_attributes(__page__, 'manufacturer |OR| brand name')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Asics |OR| Nike"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "lambda:(() => { try { return document.querySelector('#maincontent > div.page-title-wrapper.product > h1 > span').textContent } catch (e) { return '' }})()",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Men",
|
|
"Tennis Shoe"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 47,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/asics-men-s-gel-resolution-8-tennis-shoes.html, __SHOPPING__/nike-men-s-court-lite-2-tennis-shoe.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 166,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that {{relation1}} first picture and has {{relation2}} second picture. It needs to have {{relation3}} third picture.",
|
|
"intent": "Find me a shoe that is designed for the sport depicted in the first picture and has the same brand as products in the second picture. It needs to have the same color as the flower in the third picture.",
|
|
"image": [
|
|
"https://images.pexels.com/photos/2291004/pexels-photo-2291004.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"https://images.pexels.com/photos/3281608/pexels-photo-3281608.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"https://images.pexels.com/photos/112398/pexels-photo-112398.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1"
|
|
],
|
|
"instantiation_dict": {
|
|
"category": "a shoe",
|
|
"relation1": "is designed for the sport depicted in the",
|
|
"relation2": "the same brand as products in the",
|
|
"relation3": "the same color as the flower in the"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html",
|
|
"page_image_query"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_product_attributes(__page__, 'manufacturer |OR| brand name')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"adidas"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "lambda:(() => { try { return document.querySelector('#maincontent > div.page-title-wrapper.product > h1 > span').textContent } catch (e) { return '' }})()",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Basketball",
|
|
"Sneaker |OR| Shoe"
|
|
]
|
|
}
|
|
}
|
|
],
|
|
"page_image_query": [
|
|
{
|
|
"eval_image_url": "last",
|
|
"eval_image_class": ".fotorama__stage__frame",
|
|
"eval_vqa": [
|
|
{
|
|
"question": "Is the shoe red? (yes/no)",
|
|
"answer": "yes"
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 48,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/adidas-mens-harden-be-x-basketball-sneakers-shoes-casual-red.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 167,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that {{relation1}} first picture and has {{relation2}} second picture. It needs to have {{relation3}} third picture.",
|
|
"intent": "Find me a shoe that is designed for the sport depicted in the first picture and has the same brand as products in the second picture. It needs to have the same color as the third picture.",
|
|
"image": [
|
|
"https://images.pexels.com/photos/5739218/pexels-photo-5739218.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"https://images.pexels.com/photos/7154759/pexels-photo-7154759.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"https://images.pexels.com/photos/4098504/pexels-photo-4098504.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1"
|
|
],
|
|
"instantiation_dict": {
|
|
"category": "a shoe",
|
|
"relation1": "is designed for the sport depicted in the",
|
|
"relation2": "the same brand as products in the",
|
|
"relation3": "the same color as the"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "Such an item is not available on OneStopMarket.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 48,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 168,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I really like {{stuff}}. Can you find me {{product}} and add it to my shopping cart?",
|
|
"intent": "I really like this drink. Can you find me mochi that have flavor of this drink and add it to my shopping cart?",
|
|
"image": [
|
|
"https://images.pexels.com/photos/6413654/pexels-photo-6413654.jpeg"
|
|
],
|
|
"instantiation_dict": {
|
|
"stuff": "this drink",
|
|
"product": "mochi that have flavor of this drink"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart/",
|
|
"locator": "lambda:(() => { try { return Array.from(document.querySelectorAll('.item-info')).find(el => el.textContent.includes('Royal Family 2 Packs of Mini Mochi Individually Wrapped- japenese taiwanese asia sweet rice wagashi snack dessert dagashi candies cake candy drinks daifuku (Bubble Milk Tea, Total 8.4oz)')).querySelector('td.col.item > div > dl > dd').textContent.trim() } catch (e) { return '' }})()",
|
|
"required_contents": {
|
|
"exact_match": "Bubble Milk Tea"
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 49,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": "__SHOPPING__/royal-family-2-packs-of-mini-mochi-individually-wrapped-japenese-taiwanese-asia-sweet-rice-wagashi-snack-dessert-dagashi-candies-cake-candy-drinks-daifuku-bubble-milk-tea-total-8-4oz.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 169,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Can you find me {{category}} that combines the {{attribute}} of the items in the following images?",
|
|
"intent": "Can you find me a product that combines the functions of the items in the following images?",
|
|
"image": [
|
|
"https://images.pexels.com/photos/9582658/pexels-photo-9582658.jpeg",
|
|
"https://images.pexels.com/photos/3205735/pexels-photo-3205735.jpeg"
|
|
],
|
|
"instantiation_dict": {
|
|
"category": "a product",
|
|
"attribute": "functions"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "lambda:(() => { try { return document.querySelector('#maincontent > div.page-title-wrapper.product > h1 > span').textContent } catch (e) { return '' }})()",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Clock",
|
|
"Camera"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 50,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/hidden-clock-camera-wifi-hd-1080p-spy-camera-with-night-vision-motion-detection-loop-recording-covert-nanny-cam-for-home-office-surveillance-no-audio.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 170,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Can you find me {{category}} that combines the {{attributes}} of the items in the following images?",
|
|
"intent": "Can you find me a product that combines the functions of the items in the following images?",
|
|
"image": [
|
|
"https://images.pexels.com/photos/4206091/pexels-photo-4206091.jpeg",
|
|
"https://images.pexels.com/photos/1772123/pexels-photo-1772123.jpeg"
|
|
],
|
|
"instantiation_dict": {
|
|
"category": "a product",
|
|
"attributes": "functions"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "lambda:(() => { try { return document.querySelector('#maincontent > div.page-title-wrapper.product > h1 > span').textContent } catch (e) { return '' }})()",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Projection Keyboard"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 51,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/la-guapa-virtual-projection-keyboard-laser-projection-bluetooth-wireless-keyboard-for-smart-phone-pc-tablet-laptop-wireless-laser-projection-keyboard-silver.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 171,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Can you find me {{category}} that combines the {{attributes}} of the items in the following images?",
|
|
"intent": "Can you find me a taiwanese snack that combines the flavors of the items in the following images?",
|
|
"image": [
|
|
"https://images.pexels.com/photos/947879/pexels-photo-947879.jpeg",
|
|
"https://images.pexels.com/photos/4110006/pexels-photo-4110006.jpeg"
|
|
],
|
|
"instantiation_dict": {
|
|
"category": "a taiwanese snack",
|
|
"attributes": "flavors"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "lambda:(() => { try { return document.querySelector('#maincontent > div.page-title-wrapper.product > h1 > span').textContent } catch (e) { return '' }})()",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"SUNNY HILLS Pineapple Cake"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 51,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/sunny-hills-pineapple-cake-10pcs-500g-best-taiwanese-gift-sunny-hills-fresh-stock-taiwan-food-pineapple-cake.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 172,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I really like {{stuff}}. Can you find me {{product}} and add it to my shopping cart?",
|
|
"intent": "I really like this animal's pattern. Can you find me a queen size bedding set that has the same pattern and add it to my shopping cart?",
|
|
"image": [
|
|
"https://images.pexels.com/photos/39857/leopard-leopard-spots-animal-wild-39857.jpeg"
|
|
],
|
|
"instantiation_dict": {
|
|
"stuff": "this animal's pattern",
|
|
"product": "a queen size bedding set that has the same pattern"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart/",
|
|
"locator": "lambda:(() => { try { return Array.from(document.querySelectorAll('.item-info')).find(el => el.textContent.includes('Girls Leopard Print Bedding Set Teens Luxury Pink Black Cheetah Print Bed Sheet Set Twin Size for Kids Children Women Bedroom Decor Fitted Sheet Chic Wild Animal Bed Cover with 1 Pillow Case')).querySelector('td.col.item > div > dl > dd:nth-child(4)').textContent.trim() } catch (e) { return '' }})()",
|
|
"required_contents": {
|
|
"exact_match": "Queen"
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 49,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": "__SHOPPING__/girls-leopard-print-bedding-set-teens-luxury-pink-black-cheetah-print-bed-sheet-set-twin-size-for-kids-children-women-bedroom-decor-fitted-sheet-chic-wild-animal-bed-cover-with-1-pillow-case.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 173,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I really like {{stuff}}. Can you find me {{product}} and add it to my shopping cart?",
|
|
"intent": "I really like this fruit. Can you find me a 1 fl oz fragrance that has the same smell and add it to my shopping cart?",
|
|
"image": [
|
|
"https://images.pexels.com/photos/209549/pexels-photo-209549.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1"
|
|
],
|
|
"instantiation_dict": {
|
|
"stuff": "this fruit",
|
|
"product": "a 1 fl oz fragrance that has the same smell"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart/",
|
|
"locator": "lambda:(() => { try { return Array.from(document.querySelectorAll('.item-info')).find(el => el.textContent.includes('Jo Malone Grapefruit Cologne Spray for Women, 1 Ounce')).querySelector('td.col.item > div > dl > dd').textContent.trim() } catch (e) { return '' }})()",
|
|
"required_contents": {
|
|
"exact_match": "1 Fl Oz (Pack of 1)"
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 49,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": "__SHOPPING__/jo-malone-grapefruit-cologne-spray-for-women-1-ounce.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 174,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Can you find me {{category}} that combines the {{attributes}} of the items in the following images and buy it for me?",
|
|
"intent": "Can you find me a product that combines the functions of the items in the following images and buy it for me?",
|
|
"image": [
|
|
"https://images.pexels.com/photos/2529147/pexels-photo-2529147.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"https://images.pexels.com/photos/244553/pexels-photo-244553.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1"
|
|
],
|
|
"instantiation_dict": {
|
|
"category": "a product",
|
|
"attributes": "functions"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector('.order-details-items.ordered').outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"roller skate"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 52,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/sxzhsm-roller-skates-for-women-outdoor-parkour-shoes-with-wheels-for-girls-boys-kick-rollers-shoes-retractable-adults-kids-quad-roller-skates-men-unisex-skating-shoes-recreation-sneakers-eu39-white.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 175,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that is of the same brand as the product in this picture and buy {{quantity}} for me. It needs to {{description}}.",
|
|
"intent": "Find me a wireless white game controller that is of the same brand as the product in this picture and buy it for me. It needs to have at least 10 reviews and be priced between $110-$120.",
|
|
"image": "https://images.pexels.com/photos/8998292/pexels-photo-8998292.jpeg",
|
|
"instantiation_dict": {
|
|
"category": "a wireless white game controller",
|
|
"description": "have at least 10 reviews and be priced between $110-$120",
|
|
"quantity": "it"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector('.order-details-items.ordered').outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07P3L5GMW"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 53,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/xbox-wireless-controller-phantom-white-special-edition.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 176,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that is of the same brand as the product in this picture and buy {{quantity}} for me. It needs to {{description}}.",
|
|
"intent": "Find me a black headphone that is of the same brand as the product in this picture and buy it for me. It needs to be priced more than $1000.",
|
|
"image": "https://images.pexels.com/photos/3541365/pexels-photo-3541365.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"instantiation_dict": {
|
|
"category": "a black headphone",
|
|
"description": "be priced more than $1000",
|
|
"quantity": "it"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector('.order-details-items.ordered').outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B01LD5GO7I"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 53,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/sony-mdr-z1r-ww2-signature-hi-res-headphone-black-international-version.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 177,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that is of the same brand as the product in this picture and buy {{quantity}} for me. It needs to {{description}}.",
|
|
"intent": "Find me a headphone that is of the same brand as the product in this picture and buy it for me. It needs to have color silver and have at least 10 reviews with an average rating greater than 4.",
|
|
"image": "https://images.pexels.com/photos/4219883/pexels-photo-4219883.jpeg",
|
|
"instantiation_dict": {
|
|
"category": "a headphone",
|
|
"description": "have color silver and have at least 10 reviews with an average rating greater than 4",
|
|
"quantity": "it"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector('.order-details-items.ordered').outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07J9YNRWF |OR| B07CX6HHFK |OR| B00972M942"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 53,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 178,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that is of the same brand as the product in this picture and buy {{quantity}} for me. It needs to {{description}}.",
|
|
"intent": "Find me a multifunction printer (copy/scan/fax/print) that is of the same brand as the product in this picture and buy \ud83d\udd1f of them for me. It needs to have color black and have at least 5 reviews with an average rating greater than 3.",
|
|
"image": "https://images.pexels.com/photos/11129922/pexels-photo-11129922.jpeg",
|
|
"instantiation_dict": {
|
|
"category": "a multifunction printer (copy/scan/fax/print)",
|
|
"quantity": "\ud83d\udd1f of them",
|
|
"description": "have color black and have at least 5 reviews with an average rating greater than 3"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:shopping_get_order_product_quantity(__page__,'B00PZ9WV94')",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"== 10"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 53,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/hp-cf484a-laserjet-pro-mfp-m225dn-multifunction-laser-printer-copy-fax-print-scan.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 179,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that is of the same brand as the product in this picture and buy {{quantity}} for me. It needs to {{description}}.",
|
|
"intent": "Find me all of the protein bars that is of the same brand as the product in this picture and buy 12 bars of each (at the lowest possible per unit price) for me. It needs to have per unit price between $1.66 and $4.08.",
|
|
"image": "https://images.pexels.com/photos/12538285/pexels-photo-12538285.jpeg",
|
|
"instantiation_dict": {
|
|
"category": "all of the protein bars",
|
|
"quantity": "12 bars of each (at the lowest possible per unit price)",
|
|
"description": "have per unit price between $1.66 and $4.08"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:shopping_get_order_product_quantity(__page__,'B00MXUFL0E')",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"== 1"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:shopping_get_order_product_option(__page__, 'B00MXUFL0E', 'Size')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"12 Count (Pack of 1)"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:shopping_get_order_product_quantity(__page__,'B07ZD2PB9F')",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"== 1"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 53,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/kellogg-s-special-k-protein-bars-meal-replacement-protein-snacks-value-size-strawberry-19oz-box-12-bars.html, __SHOPPING__/kellogg-s-special-k-protein-bars-meal-replacement-protein-snacks-value-size-chocolatey-chip-cookie-dough-19oz-box-12-bars.html. Per unit price is calculated as listed price divided by 12."
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 180,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that is of the same brand as products in one of the following pictures and buy {{quantity}} for me. It needs to {{description}}.",
|
|
"intent": "Find me a digital camera with warranty that is of the same brand as products in one of the following pictures and buy one for me. It needs to be black and have at least 12 reviews. Furthermore, it cannot be too expensive - it needs to have price less than $700.",
|
|
"image": [
|
|
"https://images.pexels.com/photos/6708408/pexels-photo-6708408.jpeg"
|
|
],
|
|
"instantiation_dict": {
|
|
"category": "a digital camera with warranty",
|
|
"quantity": "one",
|
|
"description": "be black and have at least 12 reviews. Furthermore, it cannot be too expensive - it needs to have price less than $700"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:shopping_get_order_product_quantity(__page__,'B001P06Q66')",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"== 1"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 54,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/olympus-sp-590uz-12mp-digital-camera-with-26x-wide-angle-optical-dual-image-stabilized-zoom-and-2-7-inch-lcd-black.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 181,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/wall-art/posters-prints.html",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me something like {{item}}, but {{attribute}}, from this page.",
|
|
"intent": "Buy me something like the picture shown, but in sketching style, from this page.",
|
|
"image": "https://images.pexels.com/photos/3751675/pexels-photo-3751675.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"instantiation_dict": {
|
|
"item": "the picture shown",
|
|
"attribute": "in sketching style"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:shopping_get_order_product_option(__page__, 'B091FT6ZJC', 'Color')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Cute Elephant"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 55,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "__SHOPPING__/yelash-cute-elephant-canvas-wall-art-colorful-dots-and-sketch-elephant-picture-print-for-kids-room-bathroom-poster-framed-ready-to-hang-12-x16-x1-panel.html",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 182,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/cell-phones-accessories/cases-holsters-sleeves/basic-cases.html?p=2",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me something like {{item}}, but {{attribute}}, from this page.",
|
|
"intent": "Buy me something like what is used to protect the phone in the picture, but one with a soldier figure, from this page.",
|
|
"image": "https://images.pexels.com/photos/374004/pexels-photo-374004.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "what is used to protect the phone in the picture",
|
|
"attribute": "one with a soldier figure"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector('.order-details-items.ordered').outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B095GYK1VZ"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 55,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/generic-phone-case-compatible-with-iphone-sebastian-scratch-stan-accessories-the-shock-winter-waterproof-soldier-6-7-8-plus-se-2020-x-xr-11-pro-max-12-mini-transparent.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 183,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that is of the same brand as products in one of the following pictures and buy {{quantity}} for me. It needs to {{description}}.",
|
|
"intent": "Find me a \ud83d\udcfa that is of the same brand as products in one of the following pictures and buy 3\ufe0f\u20e3 for me. It needs to have price between $4000 and $10000.",
|
|
"image": [
|
|
"https://images.pexels.com/photos/2942361/pexels-photo-2942361.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"https://images.pexels.com/photos/16121799/pexels-photo-16121799/free-photo-of-close-up-of-cellphone.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1"
|
|
],
|
|
"instantiation_dict": {
|
|
"category": "a \ud83d\udcfa",
|
|
"quantity": "3\ufe0f\u20e3",
|
|
"description": "have price between $4000 and $10000"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:shopping_get_order_product_quantity(__page__,'B08H5STXXC |OR| B07YGWT3KV |OR| B08X4XCJ4T |OR| B0959NDNJV |OR| B09GMQ72RH |OR| B098KLX2R8')",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"== 3"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 54,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 184,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I really like {{stuff}}. Can you find me {{product}} and buy {{quantity}} for me?",
|
|
"intent": "I really like this drink. Can you find me mochi that have flavor of this drink and buy 4*2 of them for me?",
|
|
"image": [
|
|
"https://images.pexels.com/photos/12187693/pexels-photo-12187693.jpeg"
|
|
],
|
|
"instantiation_dict": {
|
|
"stuff": "this drink",
|
|
"product": "mochi that have flavor of this drink",
|
|
"quantity": "4*2 of them"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:shopping_get_order_product_quantity(__page__,'B08PHZ6G4J')",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"== 8"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:shopping_get_order_product_option(__page__, 'B08PHZ6G4J', 'Flavor Name')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Bubble Milk Tea"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 56,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/royal-family-2-packs-of-mini-mochi-individually-wrapped-japenese-taiwanese-asia-sweet-rice-wagashi-snack-dessert-dagashi-candies-cake-candy-drinks-daifuku-bubble-milk-tea-total-8-4oz.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 185,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I really like {{stuff}}. Can you find me {{product}} and buy {{quantity}} for me?",
|
|
"intent": "I really like this animal's pattern. Can you find me a twin xl size bedding set that have the same pattern and buy two for me?",
|
|
"image": [
|
|
"https://images.pexels.com/photos/267074/pexels-photo-267074.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1"
|
|
],
|
|
"instantiation_dict": {
|
|
"stuff": "this animal's pattern",
|
|
"product": "a twin xl size bedding set that have the same pattern",
|
|
"quantity": "two"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:shopping_get_order_product_quantity(__page__,'B08SQJF7PF')",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"== 2"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:shopping_get_order_product_option(__page__, 'B08SQJF7PF', 'Size')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Twin XL"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 56,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/girls-leopard-print-bedding-set-teens-luxury-pink-black-cheetah-print-bed-sheet-set-twin-size-for-kids-children-women-bedroom-decor-fitted-sheet-chic-wild-animal-bed-cover-with-1-pillow-case.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 186,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Can you find me {{category}} that is the combination of the following images and buy it for me?",
|
|
"intent": "Can you find me a sport equipment that is the combination of the following images and buy it for me?",
|
|
"image": [
|
|
"https://images.pexels.com/photos/1537671/pexels-photo-1537671.jpeg",
|
|
"https://images.pexels.com/photos/2883462/pexels-photo-2883462.jpeg"
|
|
],
|
|
"instantiation_dict": {
|
|
"category": "a sport equipment"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector('.order-details-items.ordered').outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"roller skate |OR| cycling shoes |OR| bike shoes |OR| bicycle shoes"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 57,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/sxzhsm-roller-skates-for-women-outdoor-parkour-shoes-with-wheels-for-girls-boys-kick-rollers-shoes-retractable-adults-kids-quad-roller-skates-men-unisex-skating-shoes-recreation-sneakers-eu39-white.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 187,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add the least expensive {{item}} that can hold {{storable}} to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"item": "opaque phone case",
|
|
"storable": "an iPhone X"
|
|
},
|
|
"intent": "Add the least expensive opaque phone case that can hold an iPhone X to my shopping cart.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Asuwish Compatible with iPhone Xs X 10 10s Wallet Case Tempered Glass Screen Protector Leather Flip Cover Card Holder Phone Cases for iPhoneX iPhoneXs iPhone10 i PhoneX SX 10x 10xs X\u2019s Women Men Black"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 58,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 188,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Add the least expensive {{item}} that can hold {{storable}} to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"item": "car",
|
|
"storable": "4 people"
|
|
},
|
|
"intent": "Add the least expensive car that can hold 4 people to my shopping cart.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There are no cars available on OneStopMarket.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 58,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 189,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add {{items}} to the comparison page?",
|
|
"instantiation_dict": {
|
|
"items": "the two most expensive fully black VR headsets in the \"Virtual Reality\" category"
|
|
},
|
|
"intent": "Can you add the two most expensive fully black VR headsets in the \"Virtual Reality\" category to the comparison page?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/catalog/product_compare",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"ZJJY VR Headsets, Virtual Reality Headset, Bluetooth Controller for iPhone 11/Pro/X/Xs/Max/XR/8P/7P,for Samsung S20/S10/S9/S8/Plus/Note 10/9/8,Phones w/ 4.5-6.2in Screen, L025xq",
|
|
"ZNBJJWCP 3D VR Glasses Headset Virtual Reality Goggles Play Movies Photos Enjoyment for Smartphones"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 33,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "Medium visual difficulty because the most expensive headset has some blue lighting effects on it."
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 190,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add {{items}} to the comparison page?",
|
|
"instantiation_dict": {
|
|
"items": "the two most expensive white projectors in the \"Video Projectors\" category"
|
|
},
|
|
"intent": "Can you add the two most expensive white projectors in the \"Video Projectors\" category to the comparison page?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/catalog/product_compare",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Samsung Ultra Short Throw Laser Projector - 3840 x 2160 - Front - 20000 Hour Normal Mode4K UHD - 2,000,000:1-2800 lm (Renewed)",
|
|
"Panasonic LCD Projector - 720p - HDTV - 4:3 PT-EX800ZLU"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 33,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 191,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "I've been thinking about ordering {{item}}, but {{condition}}. Can you add it to my shopping cart if it exists?",
|
|
"instantiation_dict": {
|
|
"item": "a donkey planter",
|
|
"condition": "only if it can hold 2 pots"
|
|
},
|
|
"intent": "I've been thinking about ordering a donkey planter, but only if it can hold 2 pots. Can you add it to my shopping cart if it exists?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Design Toscano NG32766 Pancho the Burro Planter Sculpture,full color"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 59,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 192,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/roasemal-back-scrubber-for-shower-silicone-back-scrubber-for-shower-dual-sided-natural-soft-and-stiff-massage-bristles-for-body-exfoliating-purple.html",
|
|
"geolocation": null,
|
|
"intent_template": "What is the width and length of this product in inches? (Not the package size)",
|
|
"instantiation_dict": {},
|
|
"intent": "What is the width and length of this product in inches? (Not the package size)",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"26.77",
|
|
"4.33"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "26.77 in x 4.33 in"
|
|
},
|
|
"intent_template_id": 60,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "Easier to perform OCR on the second image to get the dimensions."
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 193,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/cell-phones-accessories/accessories.html?p=10",
|
|
"geolocation": null,
|
|
"intent_template": "How much is the {{item}} with {{secondary_item}} in the picture on this page?",
|
|
"instantiation_dict": {
|
|
"item": "VR headset",
|
|
"secondary_item": "a dinosaur"
|
|
},
|
|
"intent": "How much is the VR headset with a dinosaur in the picture on this page?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"$63.98"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$63.98"
|
|
},
|
|
"intent_template_id": 61,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 194,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/patio-lawn-garden/gardening-lawn-care/pots-planters-container-accessories.html",
|
|
"geolocation": null,
|
|
"intent_template": "How much is the {{item}} with {{secondary_item}} in the picture on this page?",
|
|
"instantiation_dict": {
|
|
"item": "product",
|
|
"secondary_item": "the most plants"
|
|
},
|
|
"intent": "How much is the product with the most plants in the picture on this page?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"$37.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$37.99"
|
|
},
|
|
"intent_template_id": 61,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 195,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/fan-shop/footwear.html?p=5",
|
|
"geolocation": null,
|
|
"intent_template": "How much is the {{item}} with {{secondary_item}} in the picture on this page?",
|
|
"instantiation_dict": {
|
|
"item": "shoe",
|
|
"secondary_item": "black pants"
|
|
},
|
|
"intent": "How much is the shoe with black pants in the picture on this page?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"$26.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$26.99"
|
|
},
|
|
"intent_template_id": 61,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 196,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/food-beverage-gifts/herb-spice-seasoning-gifts.html?product_list_mode=list",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the item {{offset}} the {{item}} to my cart?",
|
|
"instantiation_dict": {
|
|
"offset": "two rows below",
|
|
"item": "bagel seasoning"
|
|
},
|
|
"intent": "Can you add the item two rows below the bagel seasoning to my cart?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Yemeni Hawayij"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 62,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 197,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/fan-shop/clothing.html?p=10",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the item {{offset}} the {{item}} to my cart?",
|
|
"instantiation_dict": {
|
|
"offset": "one row up and one column left of",
|
|
"item": "red and white polka dot romper"
|
|
},
|
|
"intent": "Can you add the item one row up and one column left of the red and white polka dot romper to my cart?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Sweatshirt for Men Long Sleeve Turn Down Collar Spring Summer Printed Casual Slim Fit Button Down Shirts Tops T-Shirts"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 62,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 198,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/office-products/office-electronics/printers-accessories.html?product_list_limit=36",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the item {{offset}} the {{item}} to my cart?",
|
|
"instantiation_dict": {
|
|
"offset": "in the same column but at the bottom of the page as",
|
|
"item": "HP M225DW LaserJet Pro MFP printer"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"intent": "Can you add the item in the same column but at the bottom of the page as the HP M225DW LaserJet Pro MFP printer to my cart?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Flat Scanner Cable for HP LJ Pro M1212NF 1212 1213 1216 1217 1218 121X Printer"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 62,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 199,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/home-decor-products/home-decor-accents.html",
|
|
"geolocation": null,
|
|
"intent_template": "How much does the {{item}} weigh (in {{units}})?",
|
|
"instantiation_dict": {
|
|
"item": "product with an animal on a cube",
|
|
"units": "pounds"
|
|
},
|
|
"intent": "How much does the product with an animal on a cube weigh (in pounds)?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"1.72 |OR| 1.5"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "1.72 pounds"
|
|
},
|
|
"intent_template_id": 63,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 200,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/dairy-cheese-eggs/cheese.html",
|
|
"geolocation": null,
|
|
"intent_template": "How much does the {{item}} weigh (in {{units}})?",
|
|
"instantiation_dict": {
|
|
"item": "cheese with the orange rind",
|
|
"units": "pounds"
|
|
},
|
|
"intent": "How much does the cheese with the orange rind weigh (in pounds)?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"1"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "1 pounds"
|
|
},
|
|
"intent_template_id": 63,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 201,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/playstation-4/accessories.html?p=2",
|
|
"geolocation": null,
|
|
"intent_template": "How much does the {{item}} weigh (in {{units}})?",
|
|
"instantiation_dict": {
|
|
"item": "PS4 sticker with a skull",
|
|
"units": "ounces"
|
|
},
|
|
"intent": "How much does the PS4 sticker with a skull weigh (in ounces)?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"3.84"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "3.84 ounces"
|
|
},
|
|
"intent_template_id": 63,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 202,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/patio-lawn-garden/patio-furniture-accessories.html",
|
|
"geolocation": null,
|
|
"intent_template": "What colors do the {{item}} come in?",
|
|
"instantiation_dict": {
|
|
"item": "patio set with the mountains in the background"
|
|
},
|
|
"intent": "What colors do the patio set with the mountains in the background come in?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"Aegean Blue",
|
|
"Black&khaki |OR| Black & Khaki",
|
|
"Blue",
|
|
"Red",
|
|
"Royal Blue"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "Aegean Blue, Black & Khaki, Blue, Red, Royal Blue"
|
|
},
|
|
"intent_template_id": 64,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 203,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/exercise-fitness.html?p=6",
|
|
"geolocation": null,
|
|
"intent_template": "Can you return an image url from an item on this page showing {{action}} {{item}}?",
|
|
"instantiation_dict": {
|
|
"action": "how a phone might be stored",
|
|
"item": "with the red shorts"
|
|
},
|
|
"intent": "Can you return an image url from an item on this page showing how a phone might be stored with the red shorts?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B09QQNVKTN.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B09QQNVKTN.1.jpg"
|
|
},
|
|
"intent_template_id": 65,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 204,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/exercise-fitness.html?price=0-100&product_list_limit=36",
|
|
"geolocation": null,
|
|
"intent_template": "Can you return an image url from an item on this page showing {{action}} {{item}}?",
|
|
"instantiation_dict": {
|
|
"action": "how someone might touch their toes",
|
|
"item": "in the gray tank top"
|
|
},
|
|
"intent": "Can you return an image url from an item on this page showing how someone might touch their toes in the gray tank top?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There is no image of the guy in the gray tank top touching his toes.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 65,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 205,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/bedding/kids-bedding.html",
|
|
"geolocation": null,
|
|
"intent_template": "Can you return an image url from an item on this page showing {{action}} {{item}}?",
|
|
"instantiation_dict": {
|
|
"action": "how someone might cuddle their dog",
|
|
"item": "in the unicorn blanket"
|
|
},
|
|
"intent": "Can you return an image url from an item on this page showing how someone might cuddle their dog in the unicorn blanket?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B09MB3WDF5.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B09MB3WDF5.1.jpg"
|
|
},
|
|
"intent_template_id": 65,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 206,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/bedding/kids-bedding.html?p=4",
|
|
"geolocation": null,
|
|
"intent_template": "Can you return an image url from an item on this page showing {{action}} {{item}}?",
|
|
"instantiation_dict": {
|
|
"action": "how",
|
|
"item": "the celebrity blanket might look when folded"
|
|
},
|
|
"intent": "Can you return an image url from an item on this page showing how the celebrity blanket might look when folded?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B08L4ZV4GX.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B08L4ZV4GX.1.jpg"
|
|
},
|
|
"intent_template_id": 65,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 207,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breakfast-foods/cereals.html?p=5",
|
|
"geolocation": null,
|
|
"intent_template": "What is the name of the monster on that {{color}} box in the bottom row?",
|
|
"instantiation_dict": {
|
|
"color": "blue"
|
|
},
|
|
"intent": "What is the name of the monster on that blue box in the bottom row?",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"Boo Berry"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "Boo Berry"
|
|
},
|
|
"intent_template_id": 66,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 208,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breakfast-foods/cereals.html?p=5",
|
|
"geolocation": null,
|
|
"intent_template": "What is the name of the monster on that {{color}} box in the bottom row?",
|
|
"instantiation_dict": {
|
|
"color": "brown"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"intent": "What is the name of the monster on that brown box in the bottom row?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"Count Chocula |OR| COUNT CHOCULA"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "Count Chocula"
|
|
},
|
|
"intent_template_id": 66,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 209,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breakfast-foods/cereals.html?p=5",
|
|
"geolocation": null,
|
|
"intent_template": "What is the name of the monster on that {{color}} box in the bottom row?",
|
|
"instantiation_dict": {
|
|
"color": "green"
|
|
},
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"intent": "What is the name of the monster on that green box in the bottom row?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There is no green box.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 66,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 210,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breakfast-foods/cereals.html?p=9",
|
|
"geolocation": null,
|
|
"intent_template": "How many {{attribute}} does the box with the {{object}} have?",
|
|
"instantiation_dict": {
|
|
"attribute": "vitamins and minerals",
|
|
"object": "unicorn"
|
|
},
|
|
"intent": "How many vitamins and minerals does the box with the unicorn have?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"12"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "12 vitamins and minerals"
|
|
},
|
|
"intent_template_id": 67,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 211,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breakfast-foods/cereals.html?p=11",
|
|
"geolocation": null,
|
|
"intent_template": "How many {{attribute}} does the box with the {{object}} have?",
|
|
"instantiation_dict": {
|
|
"attribute": "grams of whole grain (per serving)",
|
|
"object": "volleyball player"
|
|
},
|
|
"intent": "How many grams of whole grain (per serving) does the box with the volleyball player have?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"22"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "22 grams"
|
|
},
|
|
"intent_template_id": 67,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 212,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/patio-lawn-garden/gardening-lawn-care.html?p=4",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the {{item}} with {{number}} stars to my cart?",
|
|
"instantiation_dict": {
|
|
"item": "red flower seeds",
|
|
"number": "around 4"
|
|
},
|
|
"intent": "Can you add the red flower seeds with around 4 stars to my cart?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Red Roselle Seeds (Hibiscus sabdariffa) 50+ Tropical Hibiscus Seeds Packed in FROZEN SEED CAPSULES for Growing Seeds Now or Saving Seeds for Years"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 68,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 213,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/patio-lawn-garden/patio-furniture-accessories.html?p=6",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the {{item}} with {{number}} stars to my cart?",
|
|
"instantiation_dict": {
|
|
"item": "patio set that has water in the background",
|
|
"number": "the most"
|
|
},
|
|
"intent": "Can you add the patio set that has water in the background with the most stars to my cart?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Tuoze 6 Pieces Patio Furniture Sectional Outdoor All Weather PE Rattan Wicker Lawn Conversation Cushioned Garden Sofa Set with Glass Coffee Table (Beige)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 68,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 214,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/wall-art/posters-prints.html?p=23",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the {{item}} with {{number}} stars to my cart?",
|
|
"instantiation_dict": {
|
|
"item": "photo collage",
|
|
"number": "a little more than 3"
|
|
},
|
|
"intent": "Can you add the photo collage with a little more than 3 stars to my cart?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Collage Photo Canvas Prints Custom Multi Personalized Picture with Your Kids Family Wedding Images Customized Wall Art Home Decor for Living Room Bedroom Digital Printed Gifts"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 68,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 215,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/wall-art/posters-prints.html?p=23",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the {{item}} with {{number}} stars to my cart?",
|
|
"instantiation_dict": {
|
|
"item": "flower picture",
|
|
"number": "4.5"
|
|
},
|
|
"intent": "Can you add the flower picture with 4.5 stars to my cart?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Flowers Home Decorations 3 Panels Purple Lavender Flower Artwork for Living Room Office Bathroom Wall Decor Posters and Prints Frame to Hang (Lavender-2, 12*16inch)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 68,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 216,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/foot-hand-nail-care/nail-art-polish.html?p=5",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add {{item}} {{condition}} to my wishlist?",
|
|
"instantiation_dict": {
|
|
"item": "the one",
|
|
"condition": "that looks like a microwave"
|
|
},
|
|
"intent": "Can you add the one that looks like a microwave to my wishlist?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"JJ CARE Sterilizer for Salon 15L Capacity, 2-in1 Sanitizer Box and Dry Heat Sterilizer Cabinet Tabletop with Stainless Tray, Sterilizer Cabinet Sanitizing Machine"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 69,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 217,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/foot-hand-nail-care/nail-art-polish.html?p=5",
|
|
"geolocation": null,
|
|
"intent_template": "What colors do the {{item}} come in?",
|
|
"instantiation_dict": {
|
|
"item": "mini ring trays"
|
|
},
|
|
"intent": "What colors do the mini ring trays come in?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"purple |OR| violet",
|
|
"yellow |OR| gold",
|
|
"black",
|
|
"pink"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "Purple, yellow, black, and pink"
|
|
},
|
|
"intent_template_id": 64,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 218,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/health-household/diet-sports-nutrition/nutrition-bars-drinks.html?p=3",
|
|
"geolocation": null,
|
|
"intent_template": "What colors do the {{item}} come in?",
|
|
"instantiation_dict": {
|
|
"item": "bars in the bottom left"
|
|
},
|
|
"intent": "What colors do the bars in the bottom left come in?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"green",
|
|
"blue",
|
|
"pink",
|
|
"yellow |OR| gold"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "Green, blue, pink, and yellow"
|
|
},
|
|
"intent_template_id": 64,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 219,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/men/uniforms-work-safety.html",
|
|
"geolocation": null,
|
|
"intent_template": "What {{query}} {{question}}?",
|
|
"instantiation_dict": {
|
|
"query": "are the two types of birds",
|
|
"question": "on the front of that colorful shirt"
|
|
},
|
|
"intent": "What are the two types of birds on the front of that colorful shirt?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"toucan",
|
|
"parrot"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "A toucan and parrots"
|
|
},
|
|
"intent_template_id": 70,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 220,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/tools-accessories/mirrors.html",
|
|
"geolocation": null,
|
|
"intent_template": "How much is the {{item}} with {{secondary_item}} in the picture on this page?",
|
|
"instantiation_dict": {
|
|
"item": "mirror",
|
|
"secondary_item": "the charging cable"
|
|
},
|
|
"intent": "How much is the mirror with the charging cable in the picture on this page?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"$30.88"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$30.88"
|
|
},
|
|
"intent_template_id": 61,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 221,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the most expensive {{category}} to my cart that is less than ${{dollars}} and {{color}}?",
|
|
"instantiation_dict": {
|
|
"category": "smartwatch (from the \"Smartwatches\" category)",
|
|
"dollars": "200",
|
|
"color": "not black"
|
|
},
|
|
"intent": "Can you add the most expensive smartwatch (from the \"Smartwatches\" category) to my cart that is less than $200 and not black?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"SAMSUNG Galaxy Watch Active 2 (40mm, GPS, Bluetooth) Smart Watch with Advanced Health Monitoring, Fitness Tracking, and Long Lasting Battery - Rose Gold (US Version) (Renewed)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 71,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 222,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the most expensive {{category}} to my cart that is less than ${{dollars}} and {{color}}?",
|
|
"instantiation_dict": {
|
|
"category": "USB adapter for a Switch",
|
|
"dollars": "113",
|
|
"color": "looks like bricks"
|
|
},
|
|
"intent": "Can you add the most expensive USB adapter for a Switch to my cart that is less than $113 and looks like bricks?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"8Bitdo Wireless USB Adapter 1 for Switch, Switch OLED, Windows, Mac & Raspberry Pi, Compatible with Switch Pro, Switch Joy-con, PS5 PS4 Controller and More"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 71,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 223,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add all the {{items}} {{condition}} to my shopping cart?",
|
|
"intent": "Can you add all the amiibo figures that cost less than $50 to my shopping cart?",
|
|
"instantiation_dict": {
|
|
"items": "amiibo figures that cost",
|
|
"condition": "less than $50"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"amiibo SAMUS/E.M.M.I. 2-in-1 Pack (Nintendo Switch)",
|
|
"Nintendo amiibo - Ice Climbers - Super Smash Bros. Series",
|
|
"Nintendo Amiibo - Chrom - Super Smash Bros. Series - Switch",
|
|
"Nintendo Amiibo - Link: The Legend of Zelda: Link's Awakening Series - Switch"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 72,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 224,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "{{information}}. Can you add {{items}} to my cart?",
|
|
"intent": "I did this activity last weekend. Can you add the amiibo most likely to do this to my cart?",
|
|
"instantiation_dict": {
|
|
"information": "I did this activity last weekend",
|
|
"items": "the amiibo most likely to do this"
|
|
},
|
|
"image": "https://images.pexels.com/photos/12985963/pexels-photo-12985963.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"require_reset": true,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Nintendo amiibo - Ice Climbers - Super Smash Bros. Series"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 73,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 225,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/tools-accessories/mirrors.html?p=3",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the product that looks most like {{emojis}} to my cart?",
|
|
"instantiation_dict": {
|
|
"emojis": "\ud83e\udd0d\ud83e\udd0d\ud83e\udd0d"
|
|
},
|
|
"intent": "Can you add the product that looks most like \ud83e\udd0d\ud83e\udd0d\ud83e\udd0d to my cart?",
|
|
"require_reset": true,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"FRCOLOR 3pcs Hand Mirror Heart Handheld Mirror Cosmetic Mirror with Handle for Women Travel Hairdresser Salon"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 74,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 226,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/cell-phones-accessories/cases-holsters-sleeves/basic-cases.html?p=5",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the product that looks most like {{emojis}} to my cart?",
|
|
"instantiation_dict": {
|
|
"emojis": "\ud83d\udc04"
|
|
},
|
|
"intent": "Can you add the product that looks most like \ud83d\udc04 to my cart?",
|
|
"require_reset": true,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"KANGHAR iPhone 12 Tire Cow,iPhone 12 Pro Tire Case Black White Slim Anti-Scratch Shockproof Skid Outline Durable PC Layer TPU Bumper Anti-Dropping Full Body Protection Cover -6.1 Inch"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 74,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 227,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/wall-art.html?p=6",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the product that looks most like {{emojis}} to my cart?",
|
|
"instantiation_dict": {
|
|
"emojis": "\ud83d\udc80"
|
|
},
|
|
"intent": "Can you add the product that looks most like \ud83d\udc80 to my cart?",
|
|
"require_reset": true,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Canvas Prints All is Vanity Wood Framed Canvas Wall Art Home Office Decor Ready to Hang 16\"x20\""
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 74,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 228,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/wall-art.html?p=14",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the product that looks most like {{emojis}} to my cart?",
|
|
"instantiation_dict": {
|
|
"emojis": "a single \ud83c\udf3b"
|
|
},
|
|
"intent": "Can you add the product that looks most like a single \ud83c\udf3b to my cart?",
|
|
"require_reset": true,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Bathroom Decor Artwork Black and White Animal Resting Elephant Look Sunflower Field Framed Wall Art Giclee Wall Decor on Canvas Stretched Artwork Living Room Bedroom Ready to Hang,11x14in"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 74,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 229,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/wall-art/posters-prints.html?p=24",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the product that looks most like {{emojis}} to my cart?",
|
|
"instantiation_dict": {
|
|
"emojis": "this pattern: \ud83c\udded\ud83c\uddfa"
|
|
},
|
|
"intent": "Can you add the product that looks most like this pattern: \ud83c\udded\ud83c\uddfa to my cart?",
|
|
"require_reset": true,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"When Sick Kids Should Stay Home from School Poster - Laminated, 12x18 in. - Pre-K, Home Daycare Supplies - Elementary School Nurse Office Decor - Pediatric Health"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 74,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 230,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/fan-shop/clothing.html?p=2",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the {{item}} that look like they are from {{reference}} to my wishlist?",
|
|
"instantiation_dict": {
|
|
"item": "pants",
|
|
"reference": "the Twister game"
|
|
},
|
|
"intent": "Can you add the pants that look like they are from the Twister game to my wishlist?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"DZQUY Men's Classic Plaid Pants Chinos Stretch Slim Fit Lattice Trousers Casual Running Jogger Business Pencil Dress Pants"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 75,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 231,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/fan-shop/clothing.html?p=6",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the {{item}} that look like they are from {{reference}} to my wishlist?",
|
|
"instantiation_dict": {
|
|
"item": "boxers",
|
|
"reference": "space"
|
|
},
|
|
"intent": "Can you add the boxers that look like they are from space to my wishlist?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Men's Boxer Briefs Soft Cotton Boxers Cozy Trunks Breathable Underpants Sexy Low Rise Underwear Stretch Ice Silk Panties"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 75,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 232,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/playstation-4/accessories.html?p=9",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add the {{item}} that look like they are from {{reference}} to my wishlist?",
|
|
"instantiation_dict": {
|
|
"item": "decals",
|
|
"reference": "an anime"
|
|
},
|
|
"intent": "Can you add the decals that look like they are from an anime to my wishlist?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Vanknight Vinyl Decal Skin Stickers Cover for PS4 Console Playstation 2 Controllers"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 75,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 233,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/xbox-one/accessories.html?p=4",
|
|
"geolocation": null,
|
|
"intent_template": "Between {{item1}} and {{item2}}, add the cheaper one to my cart and the other to my wishlist.",
|
|
"instantiation_dict": {
|
|
"item1": "the red and black controller",
|
|
"item2": "the controller with green accents"
|
|
},
|
|
"intent": "Between the red and black controller and the controller with green accents, add the cheaper one to my cart and the other to my wishlist.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Microsoft Xbox One Wireless Controller - Volcano Shadow (Renewed)"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Wired Controller for Xbox One, High Performance USB Gamepad Remote Joystick Controller with Dual Vibration and Audio Jack for Xbox One/X/S and PC Windows 7/8/10 (Black)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 76,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 234,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/kitchen-dining/kitchen-table-linens.html",
|
|
"geolocation": null,
|
|
"intent_template": "Between {{item1}} and {{item2}}, add the cheaper one to my cart and the other to my wishlist.",
|
|
"instantiation_dict": {
|
|
"item1": "the second item in the top row",
|
|
"item2": "the one below it"
|
|
},
|
|
"intent": "Between the second item in the top row and the one below it, add the cheaper one to my cart and the other to my wishlist.",
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"ARTSHOWING Anchor Table Runner and Placemats Set of 6, Burlap Linen Table Runners 13x90inch, Heat-Insulating Placemats for Table Decor, Love The Life You Live"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"13x90'' Table Runner with Placemats Set of 6 Live Every Moment Laugh Every Day Love Beyond Words Honeycomb Yellow Background Non-Slip Washable Table Mats Table Runner Set for Dining Table Home Decor"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 76,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 235,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/kitchen-dining/kitchen-table-linens.html?p=4",
|
|
"geolocation": null,
|
|
"intent_template": "Between {{item1}} and {{item2}}, add the cheaper one to my cart and the other to my wishlist.",
|
|
"instantiation_dict": {
|
|
"item1": "the Japanese style tablecover",
|
|
"item2": "the 3 leaf clover one"
|
|
},
|
|
"intent": "Between the Japanese style tablecover and the 3 leaf clover one, add the cheaper one to my cart and the other to my wishlist.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"GGACEN Decorative Elastic Edged Square Fitted Tablecloth,Miyajima Torii Sumo and Flag Polyester Indoor Outdoor Fitted Tablecover for Banquet Buffet Kitchen Dining and Party Fit Square Table up to 30\""
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"St. Patrick's Day Table Runner 36 Inches Long Farmhouse Dress Scarves, Green Clover Black and White Buffalo Plaid Dining Tablerunner for Coffee Table/Kitchen Island/Party D\u00e9cor, Small 13\" x 36\""
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 76,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 236,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/customer/account/",
|
|
"geolocation": null,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"intent_template": "Can you set the {{side}} side address to {{address}}? My phone number is also {{number}}.",
|
|
"instantiation_dict": {
|
|
"side": "right",
|
|
"address": "5000 Forbes Ave, Pittsburgh, PA 15213",
|
|
"number": "(412) 268-2000"
|
|
},
|
|
"intent": "Can you set the right side address to 5000 Forbes Ave, Pittsburgh, PA 15213? My phone number is also (412) 268-2000.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/customer/account/",
|
|
"locator": "lambda:(() => { try { return document.querySelector('#maincontent > div.columns > div.column.main > div.block.block-dashboard-addresses > div.block-content > div.box.box-shipping-address > div.box-content > address').textContent } catch (e) { return '' }})()",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"5000 Forbes Ave",
|
|
"Pittsburgh",
|
|
"Pennsylvania",
|
|
"15213",
|
|
"(412) 268-2000 |OR| 4122682000 |OR| 412-268-2000"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 77,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 237,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/customer/account/",
|
|
"geolocation": null,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"intent_template": "Can you set the {{side}} side address to {{address}}? My phone number is also {{number}}.",
|
|
"instantiation_dict": {
|
|
"side": "left",
|
|
"address": "201 N Goodwin Ave in Urbana Illinois 61801",
|
|
"number": "2173333426"
|
|
},
|
|
"intent": "Can you set the left side address to 201 N Goodwin Ave in Urbana Illinois 61801? My phone number is also 2173333426.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/customer/account/",
|
|
"locator": "lambda:(() => { try { return document.querySelector('#maincontent > div.columns > div.column.main > div.block.block-dashboard-addresses > div.block-content > div.box.box-billing-address > div.box-content > address').textContent } catch (e) { return '' }})()",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"201 N Goodwin Ave",
|
|
"Urbana",
|
|
"Illinois",
|
|
"61801",
|
|
"(217) 333-3426 |OR| 2173333426 |OR| 217-333-3426"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 77,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 238,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/cell-phones-accessories/cases-holsters-sleeves/flip-cases.html?p=3",
|
|
"geolocation": null,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"intent_template": "From {{location}}, can you add the two items with the best ratings to my cart, and the others to my wishlist?",
|
|
"instantiation_dict": {
|
|
"location": "the third column"
|
|
},
|
|
"intent": "From the third column, can you add the two items with the best ratings to my cart, and the others to my wishlist?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"SafeSleeve EMF Protection Anti Radiation iPhone Case: iPhone 12 and iPhone 12 Pro RFID EMF Blocking Wallet Cell Phone Case (Black)"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"ONETOP Compatible with iPhone 12 Compatible with iPhone 12 Pro Wallet Case with Card Holder, PU Leather Kickstand Card Slots Case, Double Magnetic Clasp Durable Shockproof Cover 6.1 Inch(Blue)",
|
|
"LUPA iPhone X Case with Card Holder -Slim & Lightweight iPhone X Wallet Case - for Women & Men - Faux Leather - iPhone Xs Cases with Magnetic Closure\u2013 Light Brown (5.8 Inch Diagonal Screen Size)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 78,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 239,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/cell-phones-accessories/cases-holsters-sleeves/basic-cases.html?p=12",
|
|
"geolocation": null,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"intent_template": "From {{location}}, can you add the two items with the best ratings to my cart, and the others to my wishlist?",
|
|
"instantiation_dict": {
|
|
"location": "the top row"
|
|
},
|
|
"intent": "From the top row, can you add the two items with the best ratings to my cart, and the others to my wishlist?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Samsung Galaxy A71 5G Case Flash Ultrathin Silicone Soft Case, Flower, Intimate Butterfly Flash Stand, Samsung A71 5G Mobile Case (not Applicable to A71 4G) (Rose Gold)",
|
|
"Square iPhone 11 Case,Tzomsze Cute Full Camera Lens Protection & Electroplate Reinforced Corners Shockproof Edge Bumper Case Compatible with iPhone 11 [6.1 inches] -Candy Pink"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Case for iPhone SE 2020 iPhone 7 8 for Boys Teen, Itsfaxinke Soft Sturdy Slim Anti Scratch Durable Shell Nonslip Flexible iPhone SE2 2nd Generation Phone Cover (RBshark)",
|
|
"GVIEWIN Designed for iPhone 13 Case 6.1 Inch 2021, Clear Flower Soft & Flexible TPU Shockproof Women Girls Phone Cover Floral Pattern Design Bumper Protective Case\uff08Magnolia/White\uff09"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 78,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 240,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/legacy-systems/playstation-systems.html?p=2&product_list_limit=15&product_list_mode=list",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add {{item}} {{condition}} to my wishlist?",
|
|
"instantiation_dict": {
|
|
"item": "the items",
|
|
"condition": "corresponding to the prime numbered positions on this page"
|
|
},
|
|
"intent": "Can you add the items corresponding to the prime numbered positions on this page to my wishlist?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Orange Chrome Mirror Vinyl Decal Faceplate Mod Skin Kit for Sony PlayStation Portable 3000 Console by System Skins",
|
|
"PS3 Controller Wireless Bluetooth PlayStation 3 Remote with Charger Cable (White+Blue)",
|
|
"UUShop Protective Vinyl Skin Sticker Decal Warp for Sony Playstation VR Skull",
|
|
"Extreme Sim Racing Wheel Stand Cockpit SXT V2 Racing Simulator - Racing Wheel Stand Black Edition For Logitech G25, G27, G29, G920, Thrustmaster And Fanatec - Heavy Dutty and Foldable",
|
|
"PS4 Slim Skins - Decals for PS4 Controller Playstation 4 Slim - Stickers Cover for PS4 Slim Controller Sony Playstation Four Slim Accessories with Dualshock 4 Two Controllers Skin - Deadpool",
|
|
"Game Controller Stand Holder Wall Mount - 2 Pack for Gaming&Audio Headsets Holder Hook, Controller Headset Stand Holder for PS5/PS4/Xbox Gamer Gifts,No Screws, Easy to Install - Black"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 69,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 241,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/deli-prepared-foods/deli-meats-cheeses.html",
|
|
"geolocation": null,
|
|
"intent_template": "Can you return an image link showing the {{item}} in another angle?",
|
|
"instantiation_dict": {
|
|
"item": "Serrano Ham Bone"
|
|
},
|
|
"intent": "Can you return an image link showing the Serrano Ham Bone in another angle?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B074DKNVPL.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B074DKNVPL.1.jpg"
|
|
},
|
|
"intent_template_id": 79,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 242,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/heating-cooling-air-quality.html?p=4",
|
|
"geolocation": null,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"intent_template": "Can you return an image link of the {{item}} in another angle?",
|
|
"instantiation_dict": {
|
|
"item": "fireplace in the bottom left"
|
|
},
|
|
"intent": "Can you return an image link of the fireplace in the bottom left in another angle?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B07H3K871G.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07H3K871G.1.jpg"
|
|
},
|
|
"intent_template_id": 80,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 243,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/fan-shop/clothing.html?p=8",
|
|
"geolocation": null,
|
|
"intent_template": "Can you return an image link of the {{item}} in another angle?",
|
|
"instantiation_dict": {
|
|
"item": "black and white mens shirt"
|
|
},
|
|
"intent": "Can you return an image link of the black and white mens shirt in another angle?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B09JSYYC12.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B09JSYYC12.1.jpg"
|
|
},
|
|
"intent_template_id": 80,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 244,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/health-household/health-care.html?p=4",
|
|
"geolocation": null,
|
|
"intent_template": "{{information}}. Can you add {{items}} to my cart?",
|
|
"intent": "I am going to this place soon. Can you add the most practical item for my trip on this page to my cart?",
|
|
"instantiation_dict": {
|
|
"information": "I am going to this place soon",
|
|
"items": "the most practical item for my trip on this page"
|
|
},
|
|
"image": "https://images.pexels.com/photos/975771/pexels-photo-975771.jpeg",
|
|
"require_reset": true,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"OFF! Deep Woods Mosquito and Insect Repellent Wipes, Long lasting, 12 Individually Wrapped Wipes (1)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 73,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 245,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/health-household/health-care.html?p=7",
|
|
"geolocation": null,
|
|
"intent_template": "{{information}}. Can you add {{items}} to my cart?",
|
|
"intent": "I am going to this place soon. Can you add the most practical footwear for my trip on this page to my cart?",
|
|
"instantiation_dict": {
|
|
"information": "I am going to this place soon",
|
|
"items": "the most practical footwear for my trip on this page"
|
|
},
|
|
"image": "https://images.pexels.com/photos/5721397/pexels-photo-5721397.jpeg",
|
|
"require_reset": true,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Spenco Men's Tribal Elite Sandal"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 73,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 246,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/keychron-k10-full-size-104-keys-bluetooth-wireless-usb-wired-mechanical-gaming-keyboard-for-mac-with-gateron-brown-switch-multitasking-white-led-backlight-computer-keyboard-for-windows-laptop.html",
|
|
"geolocation": null,
|
|
"intent_template": "This would make a great birthday gift for my friend! Can you order another one on this site {{modification}} to {{address}}? My phone number is also {{number}} in case it is needed.",
|
|
"instantiation_dict": {
|
|
"modification": "from this brand that most fits his black/white themed setup",
|
|
"address": "353 Jane Stanford Way in Stanford, Cali 94305",
|
|
"number": "(650) 555-0111"
|
|
},
|
|
"intent": "This would make a great birthday gift for my friend! Can you order another one on this site from this brand that most fits his black/white themed setup to 353 Jane Stanford Way in Stanford, Cali 94305? My phone number is also (650) 555-0111 in case it is needed.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B08CNBF28Z |OR| B08CN9ZV2N"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \"#maincontent > div.columns > div.column.main > div.block.block-order-details-view > div.block-content > div.box.box-order-shipping-address > div > address\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"353 Jane Stanford Way",
|
|
"Stanford",
|
|
"California",
|
|
"94305",
|
|
"(650) 555-0111 |OR| 6505550111 |OR| 650-555-0111"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 81,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/keychron-c2-full-size-wired-mechanical-keyboard-for-mac-hot-swappable-gateron-g-pro-blue-switch-white-backlight-104-keys-abs-keycaps-gaming-keyboard-for-windows-type-c-braid-cable.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 247,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/shop-succulents-assorted-collection-variety-set-of-hand-selected-fully-rooted-live-indoor-succulent-plants-6-pack.html",
|
|
"geolocation": null,
|
|
"intent_template": "This would make a great birthday gift for my friend! Can you order another one on this site {{modification}} to {{address}}? My phone number is also {{number}} in case it is needed.",
|
|
"instantiation_dict": {
|
|
"modification": "of a single plant that looks most like the middle right plant in the first picture",
|
|
"address": "3235 Voigt Dr, La Jolla, CA 92093",
|
|
"number": "(858) 555-0172"
|
|
},
|
|
"intent": "This would make a great birthday gift for my friend! Can you order another one on this site of a single plant that looks most like the middle right plant in the first picture to 3235 Voigt Dr, La Jolla, CA 92093? My phone number is also (858) 555-0172 in case it is needed.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09QXD1DVY |OR| B07C988M51"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \"#maincontent > div.columns > div.column.main > div.block.block-order-details-view > div.block-content > div.box.box-order-shipping-address > div > address\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"3235 Voigt",
|
|
"La Jolla",
|
|
"California",
|
|
"92093",
|
|
"(858) 555-0172 |OR| 8585550172 |OR| 858-555-0172"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 81,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 248,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/snacks-sweets/chocolate.html?p=4",
|
|
"geolocation": null,
|
|
"intent_template": "Order {{product}}. If the shipping is more than 7% of the total price, leave a 3 star review mentioning it, otherwise 5.",
|
|
"instantiation_dict": {
|
|
"product": "a 6 pack of the green chocolate bars"
|
|
},
|
|
"intent": "Order a 6 pack of the green chocolate bars. If the shipping is more than 7% of the total price, leave a 3 star review mentioning it, otherwise 5.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09PQ6G5WL",
|
|
"6 Pack"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_sku_latest_review_rating(\"B09PQ6G5WL\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"60"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 82,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 249,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/patio-lawn-garden/patio-furniture-accessories.html",
|
|
"geolocation": null,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"intent_template": "Order {{product}}. If the shipping is more than 7% of the total price, leave a 3 star review mentioning it, otherwise 5.",
|
|
"instantiation_dict": {
|
|
"product": "the second thing in the top row"
|
|
},
|
|
"intent": "Order the second thing in the top row. If the shipping is more than 7% of the total price, leave a 3 star review mentioning it, otherwise 5.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07SYHF5R2"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_sku_latest_review_rating(\"B07SYHF5R2\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"100"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 82,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 250,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/electronics/headphones/earbud-headphones.html?p=6",
|
|
"geolocation": null,
|
|
"intent_template": "I have {{subjects}}, can you order enough {{product}} so each can get their own?",
|
|
"instantiation_dict": {
|
|
"subjects": "twin sons",
|
|
"product": "soccer ball earbuds"
|
|
},
|
|
"intent": "I have twin sons, can you order enough soccer ball earbuds so each can get their own?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09G6MGFPZ"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_order_product_quantity(__page__, \"B09G6MGFPZ\")",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"== 2"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 83,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 251,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/alcoholic-beverages/wine.html",
|
|
"geolocation": null,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"intent_template": "I have {{subjects}}, can you order enough {{product}} so each can get their own?",
|
|
"instantiation_dict": {
|
|
"subjects": "a dozen wedding guests",
|
|
"product": "of the (non-alcoholic) white wine in the first row"
|
|
},
|
|
"intent": "I have a dozen wedding guests, can you order enough of the (non-alcoholic) white wine in the first row so each can get their own?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B005J0KH2C"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_order_product_quantity(__page__, \"B005J0KH2C\")",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"== 12"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 83,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 252,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/legacy-systems/nintendo-systems.html",
|
|
"geolocation": null,
|
|
"intent_template": "I have {{subjects}}, can you order enough {{product}} so each can get their own?",
|
|
"instantiation_dict": {
|
|
"subjects": "octuplets on the way",
|
|
"product": "white wii remotes"
|
|
},
|
|
"intent": "I have octuplets on the way, can you order enough white wii remotes so each can get their own?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B091YR9XRH"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_order_product_quantity(__page__, \"B091YR9XRH\")",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"== 4"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 83,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 253,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order {{product}} and let me know the final price?",
|
|
"instantiation_dict": {
|
|
"product": "a wii remote with an M logo"
|
|
},
|
|
"intent": "Can you order a wii remote with an M logo and let me know the final price?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match",
|
|
"program_html"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"94.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07BZRFNL8"
|
|
]
|
|
}
|
|
}
|
|
],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$94.99"
|
|
},
|
|
"intent_template_id": 84,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 254,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/office-products/office-school-supplies/desk-accessories-workspace-organizers.html",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order {{product}} and let me know the final price?",
|
|
"instantiation_dict": {
|
|
"product": "the product below the lady in the red shirt"
|
|
},
|
|
"intent": "Can you order the product below the lady in the red shirt and let me know the final price?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match",
|
|
"program_html"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"200"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B073BL7NH7"
|
|
]
|
|
}
|
|
}
|
|
],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$200.00"
|
|
},
|
|
"intent_template_id": 84,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 255,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/office-products/office-furniture-lighting/chairs-sofas.html",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order {{product}} and let me know the final price?",
|
|
"instantiation_dict": {
|
|
"product": "two of the chair with the spine graphic in black"
|
|
},
|
|
"intent": "Can you order two of the chair with the spine graphic in black and let me know the final price?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match",
|
|
"program_html"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"689.98"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07WS7YJLJ",
|
|
"Black"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_order_product_quantity(__page__, \"B07WS7YJLJ\")",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"== 2"
|
|
]
|
|
}
|
|
}
|
|
],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$689.98"
|
|
},
|
|
"intent_template_id": 84,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 256,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/aroy-d-longan-in-syrup-20oz-565g-2-pack.html",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add {{items}} to the comparison page?",
|
|
"instantiation_dict": {
|
|
"items": "this and the other canned fruit (of the same brand) that looks like this, but red instead of brown"
|
|
},
|
|
"intent": "Can you add this and the other canned fruit (of the same brand) that looks like this, but red instead of brown to the comparison page?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/catalog/product_compare",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Aroy-D Longan in Syrup 20oz (565g), 2 pack",
|
|
"Aroy-d Rambutan in Syrup (Pack of 6)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 33,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 257,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add {{item}} {{condition}} to my wishlist?",
|
|
"intent": "Can you add a light fixture (from the \"Wall Lights\" section) that looks like \ud83c\udf39 to my wishlist?",
|
|
"instantiation_dict": {
|
|
"item": "a light fixture (from the \"Wall Lights\" section)",
|
|
"condition": "that looks like \ud83c\udf39"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Accent Plus 10018784 Romantic Roses Wall Sconce, White"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 69,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 258,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/novelty-more/clothing.html?p=13",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order the item on this page that is cheaper between {{item1}} and {{item2}} and just leave the other one in my cart? My size is {{size}}.",
|
|
"instantiation_dict": {
|
|
"item1": "the anime shirt",
|
|
"item2": "the orange text top",
|
|
"size": "large"
|
|
},
|
|
"intent": "Can you order the item on this page that is cheaper between the anime shirt and the orange text top and just leave the other one in my cart? My size is large.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07FDS25SN",
|
|
"Large"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Mom Come Pick Me Up Hoodie, Sweatshirt With Word On Back Trendy, Funny Positive Word On Trendy Hoodie, Tumblr Hoodie, Quotes Shirts For Men"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 85,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 259,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/novelty-more/clothing.html?p=23&product_list_limit=36",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order the item on this page that is cheaper between {{item1}} and {{item2}} and just leave the other one in my cart? My size is {{size}}.",
|
|
"instantiation_dict": {
|
|
"item1": "the shirt with a bloody hand (in any color)",
|
|
"item2": "the red dress",
|
|
"size": "XXL"
|
|
},
|
|
"intent": "Can you order the item on this page that is cheaper between the shirt with a bloody hand (in any color) and the red dress and just leave the other one in my cart? My size is XXL.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09LLW8MWL"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "func:get_query_text(__page__, \"#shopping-cart-table\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Floral Lace Up Gothic Punk Dress for Womens Steampunk Vintage Lolita Spaghetti Strap High Low Dresses",
|
|
"Red",
|
|
"XX-Large"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 85,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 260,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/electronics/computers-accessories/computer-accessories-peripherals.html?product_list_order=name&product_list_limit=36",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order the {{item}} {{condition}}?",
|
|
"instantiation_dict": {
|
|
"item": "charger protectors",
|
|
"condition": "if it includes a bubble tea in the pack"
|
|
},
|
|
"intent": "Can you order the charger protectors if it includes a bubble tea in the pack?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B0953QS3ZX"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 86,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 261,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/electronics/computers-accessories/computer-accessories-peripherals.html?product_list_order=name&product_list_limit=36",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order the {{item}} {{condition}}?",
|
|
"image": "https://images.pexels.com/photos/1613621/pexels-photo-1613621.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "charger protectors",
|
|
"condition": "if it includes this thing I found on the beach in the pack"
|
|
},
|
|
"intent": "Can you order the charger protectors if it includes this thing I found on the beach in the pack?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09PCY8QQJ"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 86,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 262,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/makeup/face.html?p=6&product_list_limit=24&product_list_order=name",
|
|
"geolocation": null,
|
|
"intent_template": "Can you leave a {{number}} star review on {{product}} saying \"{{review}}\"?",
|
|
"instantiation_dict": {
|
|
"number": "5",
|
|
"product": "the palette with a flower on it",
|
|
"review": "My daughter absolutely loves it!! Would recommend to anyone"
|
|
},
|
|
"intent": "Can you leave a 5 star review on the palette with a flower on it saying \"My daughter absolutely loves it!! Would recommend to anyone\"?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__",
|
|
"locator": "func:shopping_get_sku_latest_review_rating(\"B09QYJJNW2\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"100"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "__SHOPPING__",
|
|
"locator": "func:shopping_get_sku_latest_review_text(\"B09QYJJNW2\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"My daughter absolutely loves it!! Would recommend to anyone"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 87,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/beauty-personal-care/makeup/face/eyeshadow/eyeshadow-palettes/colourpop-garden-variety-eyeshadow-palette.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 263,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Can you leave a {{number}} star review on {{product}} saying \"{{review}}\"?",
|
|
"instantiation_dict": {
|
|
"number": "2",
|
|
"product": "the most expensive CoComelon blanket set (from the \"Kids' Bedding\" category)",
|
|
"review": "I was expecting more for the price, started to fall apart after a few days"
|
|
},
|
|
"intent": "Can you leave a 2 star review on the most expensive CoComelon blanket set (from the \"Kids' Bedding\" category) saying \"I was expecting more for the price, started to fall apart after a few days\"?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__",
|
|
"locator": "func:shopping_get_sku_latest_review_rating(\"B097YHDSVG\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"40"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "__SHOPPING__",
|
|
"locator": "func:shopping_get_sku_latest_review_text(\"B097YHDSVG\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"I was expecting more for the price, started to fall apart after a few days"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 87,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/jerfyut-cartoon-bedding-sets-twin-duvet-cover-3-piece-cute-bed-set-for-boys-girls-kid-with-1-duvet-cover-2-pillowcase-bed-sheets.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 264,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?q=bonsai&product_list_order=name",
|
|
"geolocation": null,
|
|
"intent_template": "Can you leave a {{number}} star review on {{product}} saying \"{{review}}\"?",
|
|
"instantiation_dict": {
|
|
"number": "4",
|
|
"product": "the most expensive plant that looks like the hands of a clock at 6:40",
|
|
"review": "I love this plant! It's so unique and I get so many compliments on it! The only downside is that it's a little hard to take care of."
|
|
},
|
|
"intent": "Can you leave a 4 star review on the most expensive plant that looks like the hands of a clock at 6:40 saying \"I love this plant! It's so unique and I get so many compliments on it! The only downside is that it's a little hard to take care of.\"?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__",
|
|
"locator": "func:shopping_get_sku_latest_review_rating(\"B095NHLW6F\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"80"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "__SHOPPING__",
|
|
"locator": "func:shopping_get_sku_latest_review_text(\"B095NHLW6F\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"I love this plant! It's so unique and I get so many compliments on it! The only downside is that it's a little hard to take care of."
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 87,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 265,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order the cheapest thing {{item}}?",
|
|
"image": "https://images.pexels.com/photos/14038782/pexels-photo-14038782.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "like the thing on her shoulder (in the same color)"
|
|
},
|
|
"intent": "Can you order the cheapest thing like the thing on her shoulder (in the same color)?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B000FHD7PI"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 88,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/sony-zsh10cp-portable-heavy-duty-cd-radio-boombox-speaker-system-discontinued-by-manufacturer.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 266,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order the cheapest thing {{item}}?",
|
|
"image": "https://images.pexels.com/photos/9137660/pexels-photo-9137660.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "from the \"GPS System Accessories\" category to protect the display touch screen on my car (which is in the picture)"
|
|
},
|
|
"intent": "Can you order the cheapest thing from the \"GPS System Accessories\" category to protect the display touch screen on my car (which is in the picture)?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07SFY2VNB"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 88,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/lfotpp-fit-for-2019-2020-2021-silverado-1500-infotainment-3-8-inch-car-navigation-screen-protector-tempered-glass-9h-hardness-car-infotainment-display-center-touchscreen-protective-film-scratch-resistant.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 267,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/pc/accessories.html?p=4&product_list_order=price",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add {{item}} to my cart and take me to the final checkout screen before placing the order?",
|
|
"instantiation_dict": {
|
|
"item": "the RGB headset"
|
|
},
|
|
"intent": "Can you add the RGB headset to my cart and take me to the final checkout screen before placing the order?",
|
|
"require_reset": true,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match",
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/checkout/#payment",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/#payment",
|
|
"locator": "func:get_query_text(__page__, \"#opc-sidebar > div.opc-block-summary > div > div.content.minicart-items > div > ol\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"RAFIKI Gaming Headset with Microphone for PS4, PS5, Laptop, PC,Mobile Phone,7.1 Surround Sound Headphones,Memory Foam Ear Pads LED Lights, Self-Adjusting Over Ear Headset"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 89,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 268,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/skin-care/maternity.html?p=6&product_list_limit=36&product_list_order=name",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add {{item}} to my cart and take me to the final checkout screen before placing the order?",
|
|
"instantiation_dict": {
|
|
"item": "the thing that says 777 in any color"
|
|
},
|
|
"intent": "Can you add the thing that says 777 in any color to my cart and take me to the final checkout screen before placing the order?",
|
|
"require_reset": true,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match",
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/checkout/#payment",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/#payment",
|
|
"locator": "func:get_query_text(__page__, \"#opc-sidebar > div.opc-block-summary > div > div.content.minicart-items > div > ol\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"YYDS Women Sterling silver Digital Pendant Necklace Number Pendant Necklace Stainless Steel Friendship Necklace"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 89,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 269,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add {{item}} to my cart and take me to the final checkout screen before placing the order?",
|
|
"instantiation_dict": {
|
|
"item": "the cheapest live lobster that doesn't have a lemon in its picture"
|
|
},
|
|
"intent": "Can you add the cheapest live lobster that doesn't have a lemon in its picture to my cart and take me to the final checkout screen before placing the order?",
|
|
"require_reset": true,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match",
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/checkout/#payment",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/#payment",
|
|
"locator": "func:get_query_text(__page__, \"#opc-sidebar > div.opc-block-summary > div > div.content.minicart-items > div > ol\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Live Wild Caught Maine Lobster Approx. (1.5 lb. ea., 6 lobsters about 10lb) Express Shipped Chilled"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 89,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 270,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/tools-home-improvement/lighting-ceiling-fans/wall-lights.html",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add {{item}} to my cart and take me to the final checkout screen before placing the order?",
|
|
"instantiation_dict": {
|
|
"item": "the lamp that looks like an upside down matcha whisk"
|
|
},
|
|
"intent": "Can you add the lamp that looks like an upside down matcha whisk to my cart and take me to the final checkout screen before placing the order?",
|
|
"require_reset": true,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match",
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/checkout/#payment",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/#payment",
|
|
"locator": "func:get_query_text(__page__, \"#opc-sidebar > div.opc-block-summary > div > div.content.minicart-items > div > ol\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Baoblaze Retro Bamboo Wall Lamp Sconce E27 LED Lighting Fixtures Weave Creative Novelty Night Lights for Restaurant Home Aisle Tea Room Decoration"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 89,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 271,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/furniture/bedroom-furniture.html?p=5&product_list_limit=36&product_list_order=name",
|
|
"geolocation": null,
|
|
"intent_template": "{{modifier}} {{item}} to my cart and order it only if the total comes out to less than {{amount}}?",
|
|
"instantiation_dict": {
|
|
"modifier": "Can you add",
|
|
"item": "the bed with a slide in white in the triple bunk + 2 drawers configuration",
|
|
"amount": "$1000"
|
|
},
|
|
"intent": "Can you add the bed with a slide in white in the triple bunk + 2 drawers configuration to my cart and order it only if the total comes out to less than $1000?",
|
|
"require_reset": true,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09QSHGPLH",
|
|
"White",
|
|
"Triple Bunk Bed with 2 Drawers"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 90,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 272,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "{{modifier}} {{item}} to my cart and order it only if the total comes out to less than {{amount}}?",
|
|
"instantiation_dict": {
|
|
"modifier": "Can you search for \"Cheerios\", and add",
|
|
"item": "the family sized blue Cheerios cereal",
|
|
"amount": "$43"
|
|
},
|
|
"intent": "Can you search for \"Cheerios\", and add the family sized blue Cheerios cereal to my cart and order it only if the total comes out to less than $43?",
|
|
"require_reset": true,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Frosted Cheerios Breakfast Cereal with Oats, Gluten Free, 18.4 oz (Pack of 7)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 90,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 273,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen/heating-cooling-air-quality.html?product_list_order=price#",
|
|
"geolocation": null,
|
|
"intent_template": "{{modifier}} {{item}} to my cart and order it only if the total comes out to less than {{amount}}?",
|
|
"instantiation_dict": {
|
|
"modifier": "Can you add",
|
|
"item": "the Santa humidifier",
|
|
"amount": "63 quarters"
|
|
},
|
|
"intent": "Can you add the Santa humidifier to my cart and order it only if the total comes out to less than 63 quarters?",
|
|
"require_reset": true,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"4L Humidifiers for Bedroom - Top Fill Air Humidifier for Large Room, Auto Shut-off Cool Mist Humidifier, Essential-Oil Diffuser, LED Display, Constant Humidity, Mist Mode for Home, Office, Plants"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 90,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 274,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/electronics/portable-audio-video/mp3-mp4-player-accessories.html?p=3&product_list_order=name",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order the {{item}} {{condition}}?",
|
|
"instantiation_dict": {
|
|
"item": "item",
|
|
"condition": "that will make me look like \ud83d\udc31 in \ud83d\udfe6"
|
|
},
|
|
"intent": "Can you order the item that will make me look like \ud83d\udc31 in \ud83d\udfe6?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09PBQVWK1",
|
|
"Blue"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 86,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 275,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you take me to the page that has this {{subject}} {{item}}?",
|
|
"instantiation_dict": {
|
|
"subject": "character",
|
|
"item": "on a phone case"
|
|
},
|
|
"intent": "Can you take me to the page that has this character on a phone case?",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B09MVYYCCV.0.jpg",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/anime-girls-phone-case-nezuko-phone-case-anime-phone-case-for-iphone-12-compatible-from-iphone-7-series-to-13-series-cases-comes-with-a-keychain-mdz-12.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 91,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 276,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you take me to the page that has this {{subject}} {{item}}?",
|
|
"instantiation_dict": {
|
|
"subject": "character",
|
|
"item": "on a PS4 controller"
|
|
},
|
|
"intent": "Can you take me to the page that has this character on a PS4 controller?",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B0777KDV5J.0.jpg",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/vanknight-playstation-4-dualshock-ps4-controller-skin-vinyl-decals-skins-stickers-2-pack-for-ps4-controller-skins-ps4-skins-deadpool.html |OR| __SHOPPING__/ps4-slim-skins-decals-for-ps4-controller-playstation-4-slim-stickers-cover-for-ps4-slim-controller-sony-playstation-four-slim-accessories-with-dualshock-4-two-controllers-skin-deadpool.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 91,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 277,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you take me to the page that has this {{subject}} {{item}}?",
|
|
"instantiation_dict": {
|
|
"subject": "animal",
|
|
"item": "on a blanket"
|
|
},
|
|
"intent": "Can you take me to the page that has this animal on a blanket?",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B001U5URUC.0.jpg",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/duise-flannel-throw-blanket-cute-donkey-pattern-print-blanket-soft-and-comfortable-flannel-decorative-throw-blankets-for-couch-sofa-bed-throw-50-x60-flannel-fleece-blanket-for-bedroom-livingroom.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 91,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 278,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you take me to the page that has this {{subject}} {{item}}?",
|
|
"instantiation_dict": {
|
|
"subject": "top left character",
|
|
"item": "as a flash drive"
|
|
},
|
|
"intent": "Can you take me to the page that has this top left character as a flash drive?",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B01MXKU7JF.0.jpg",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/cute-lovely-cartoon-usb-2-0-flash-drive-8gb-minnie-mouse.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 91,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 279,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you take me to the page that has this {{subject}} {{item}}?",
|
|
"instantiation_dict": {
|
|
"subject": "video game character",
|
|
"item": "on slippers"
|
|
},
|
|
"intent": "Can you take me to the page that has this video game character on slippers?",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B09PPRDWBX.0.jpg",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "Such an item is not available on OneStopMarket."
|
|
},
|
|
"intent_template_id": 91,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 280,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you take me to the page that has this {{subject}} {{item}}?",
|
|
"instantiation_dict": {
|
|
"subject": "cute character",
|
|
"item": "on a short sleeved t-shirt"
|
|
},
|
|
"intent": "Can you take me to the page that has this cute character on a short sleeved t-shirt?",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B09GCG7RGC.0.jpg",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "Such an item is not available on OneStopMarket."
|
|
},
|
|
"intent_template_id": 91,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 281,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/women/shoes.html?p=6",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order the shoes on this page that I would most likely wear if I was in the image{{size}}?",
|
|
"instantiation_dict": {
|
|
"size": ""
|
|
},
|
|
"image": "https://images.pexels.com/photos/358010/pexels-photo-358010.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"intent": "Can you order the shoes on this page that I would most likely wear if I was in the image?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B0041HYWWA"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 92,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 282,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/women/shoes.html?p=10",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order the shoes on this page that I would most likely wear if I was in the image{{size}}?",
|
|
"instantiation_dict": {
|
|
"size": ""
|
|
},
|
|
"image": "https://images.pexels.com/photos/5859769/pexels-photo-5859769.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"intent": "Can you order the shoes on this page that I would most likely wear if I was in the image?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09CPNW61V"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 92,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 283,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/women/shoes.html?p=12",
|
|
"geolocation": null,
|
|
"intent_template": "Can you order the shoes on this page that I would most likely wear if I was in the image{{size}}?",
|
|
"instantiation_dict": {
|
|
"size": " in a size 8"
|
|
},
|
|
"image": "https://images.pexels.com/photos/1619719/pexels-photo-1619719.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"intent": "Can you order the shoes on this page that I would most likely wear if I was in the image in a size 8?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B00IGRMOAI",
|
|
"8"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 92,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping",
|
|
"wikipedia"
|
|
],
|
|
"task_id": 284,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__WIKIPEDIA__/wikipedia_en_all_maxi_2022-05/A/Wagyu |AND| __SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "That {{item}} in the Wikipedia page looks delicious! Can you order {{descriptors}} for me in OneStopShop?",
|
|
"instantiation_dict": {
|
|
"item": "second picture",
|
|
"descriptors": "2 pounds of thin slices"
|
|
},
|
|
"intent": "That second picture in the Wikipedia page looks delicious! Can you order 2 pounds of thin slices for me in OneStopShop?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B08ZS89DVV",
|
|
"Thin Slices",
|
|
"2lbs"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 93,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 285,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I want to eat this food, but I am {{restriction}}. Can you order the closest thing to this from the \"{{category}}\" category that fits my dietary requirements?",
|
|
"instantiation_dict": {
|
|
"restriction": "vegan",
|
|
"category": "Meat Substitutes"
|
|
},
|
|
"image": "https://images.pexels.com/photos/5602496/pexels-photo-5602496.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"intent": "I want to eat this food, but I am vegan. Can you order the closest thing to this from the \"Meat Substitutes\" category that fits my dietary requirements?",
|
|
"require_reset": false,
|
|
"reference_url": "",
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "func:get_query_text(__page__, \".order-details-items.ordered\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B08KWPWC4Y"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 94,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 286,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add {{items}} to the comparison page?",
|
|
"intent": "Can you add a product like what the person is sitting on to the comparison page?",
|
|
"image": "https://images.pexels.com/photos/4050295/pexels-photo-4050295.jpeg",
|
|
"instantiation_dict": {
|
|
"items": "a product like what the person is sitting on"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"page_image_query"
|
|
],
|
|
"page_image_query": [
|
|
{
|
|
"eval_image_url": "__SHOPPING__/catalog/product_compare/",
|
|
"eval_image_class": ".product-image-photo",
|
|
"eval_vqa": [
|
|
{
|
|
"question": "Is this a sofa? (yes/no)",
|
|
"answer": "yes"
|
|
}
|
|
]
|
|
}
|
|
],
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": ""
|
|
},
|
|
"intent_template_id": 33,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 287,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=mattress",
|
|
"geolocation": null,
|
|
"intent_template": "What is the {{size_attribute}} of the {{product}} with {{attribute}} in {{unit}}?",
|
|
"intent": "What is the width of the futon with carrot pattern in centimeters?",
|
|
"instantiation_dict": {
|
|
"size_attribute": "width",
|
|
"product": "futon",
|
|
"attribute": "carrot pattern",
|
|
"unit": "centimeters"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"90"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "90cm."
|
|
},
|
|
"intent_template_id": 95,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 288,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=reed+diffuser",
|
|
"geolocation": null,
|
|
"intent_template": "Add something like {{item}}, but {{attribute}}, from this page to my wish list.",
|
|
"intent": "Add something like the picture shown, but with rose scent, from this page to my wish list.",
|
|
"image": "https://images.pexels.com/photos/6801190/pexels-photo-6801190.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "the picture shown",
|
|
"attribute": "with rose scent"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Seed Spring Reed Diffuser Set with Sticks,Vanilla Scent Oil for Bedroom Office Gym and Stress Relief, Home Fragrance Products 50 ml / 1.7 oz |OR| Yankee Candle Reed Diffuser, Sun-Drenched Apricot Rose",
|
|
"Rose"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 24,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/seed-spring-reed-diffuser-set-with-sticks-vanilla-scent-oil-for-bedroom-office-gym-and-stress-relief-home-fragrance-products-50-ml-1-7-oz.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 289,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Add {{quantity}} of {{item}} from this page to my shopping cart.",
|
|
"intent": "Add 72 cans of the purple energy drink from this page to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"quantity": "72 cans",
|
|
"item": "the purple energy drink"
|
|
},
|
|
"require_reset": true,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart/",
|
|
"locator": "lambda:(() => {try {return Array.from(document.querySelectorAll('.item-info')).find(el => el.textContent.includes('V8 +Energy, Healthy Energy Drink, Steady Energy from Black and Green Tea, Pomegranate Blueberry, 8 Ounce Can ,Pack of 24')).querySelector('input').getAttribute('data-item-qty')} catch (e) {return ' '}})()",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"3"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 96,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/v8-energy-healthy-energy-drink-steady-energy-from-black-and-green-tea-pomegranate-blueberry-8-ounce-can-pack-of-24.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 290,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?p=2&q=pillow",
|
|
"geolocation": null,
|
|
"intent_template": "What is the {{size_attribute}} of the {{product}} with {{attribute}} in {{unit}}?",
|
|
"intent": "What is the size of the white queen size pillow with grid pattern in inches?",
|
|
"instantiation_dict": {
|
|
"size_attribute": "size",
|
|
"product": "white queen size pillow",
|
|
"attribute": "grid pattern",
|
|
"unit": "inches"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"26",
|
|
"20"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "26*20"
|
|
},
|
|
"intent_template_id": 95,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/wellboo-white-pillowcases-black-and-white-plaid-pillow-cases-large-checkered-pillow-shams-grid-cotton-queen-standard-women-men-teen-boys-girls-buffalo-check-pillowcase-decorative-envelope-closure.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 291,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?p=2&q=end+table",
|
|
"geolocation": null,
|
|
"intent_template": "What is the {{size_attribute}} of the {{product}} with {{attribute}} in {{unit}}?",
|
|
"intent": "What is the feet height of the end table with an alarm clock on it in inches?",
|
|
"instantiation_dict": {
|
|
"size_attribute": "feet height",
|
|
"product": "end table",
|
|
"attribute": "an alarm clock on it",
|
|
"unit": "inches"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"15.75"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "15.75\""
|
|
},
|
|
"intent_template_id": 95,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/lohorfire-silver-mirror-end-table-nightstand-bedside-end-table-with-storage-drawer-accent-table-for-living-room-bedroom-home-furniture-small-place.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 292,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=shirt",
|
|
"geolocation": null,
|
|
"intent_template": "What is the {{attribute}} of {{item}} that has the most similar pattern as {{property}} in the picture in this page?",
|
|
"intent": "What is the price of the shirt that has the most similar pattern as the man is wearing in the picture in this page?",
|
|
"image": "https://images.pexels.com/photos/6963032/pexels-photo-6963032.jpeg",
|
|
"instantiation_dict": {
|
|
"attribute": "price",
|
|
"item": "the shirt",
|
|
"property": "the man is wearing"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"3.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$3.99"
|
|
},
|
|
"intent_template_id": 97,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/mens-casual-plaid-collar-shirt-beach-shirts-for-men-long-t-shirt-men-s-t-shirts-muscle-shirts-mens-graphic-tees.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 293,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=bag+black+white",
|
|
"geolocation": null,
|
|
"intent_template": "What is the {{attribute}} of {{item}} that has the most similar pattern as {{property}} in the picture in this page?",
|
|
"intent": "What is the weight in ounces of the bag that has the most similar pattern as the woman is wearing in the picture in this page?",
|
|
"image": "https://images.pexels.com/photos/15543520/pexels-photo-15543520.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"instantiation_dict": {
|
|
"attribute": "weight in ounces",
|
|
"item": "the bag",
|
|
"property": "the woman is wearing"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"7.58"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "7.58 Ounces"
|
|
},
|
|
"intent_template_id": 97,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/makeup-cosmetic-bag-black-white-houndstooth-classical-portable-travel-train-case-toiletry-bags-organizer-multifunction-storage.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 294,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?p=5&q=shirt",
|
|
"geolocation": null,
|
|
"intent_template": "What is the {{attribute}} of {{item}} that has the most similar pattern as {{property}} in the picture in this page?",
|
|
"intent": "What is the price of the shirt that has the most similar pattern as the pillow in the picture in this page?",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B0969WGYKV.1.jpg",
|
|
"instantiation_dict": {
|
|
"attribute": "price",
|
|
"item": "the shirt",
|
|
"property": "the pillow"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"0.99"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "$0.99"
|
|
},
|
|
"intent_template_id": 97,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/mens-t-shirt-men-s-polo-shirts-short-sleeve-tee-basic-sports-t-shirts-floral-zipper-mens-summer-shirt-tops.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 295,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{item}} that {{attribute}} the picture.",
|
|
"intent": "Find me a rug that has the similar pattern as the animal in the picture.",
|
|
"image": "https://images.pexels.com/photos/208965/pexels-photo-208965.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "a rug",
|
|
"attribute": "has the similar pattern as the animal in"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"page_image_query"
|
|
],
|
|
"page_image_query": [
|
|
{
|
|
"eval_image_url": "last",
|
|
"eval_image_class": ".fotorama__stage__frame",
|
|
"eval_vqa": [
|
|
{
|
|
"question": "Is this a rug? (yes/no)",
|
|
"answer": "yes"
|
|
},
|
|
{
|
|
"question": "Does this item have a leopard print pattern? (yes/no)",
|
|
"answer": "yes"
|
|
}
|
|
]
|
|
}
|
|
],
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": ""
|
|
},
|
|
"intent_template_id": 98,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/modern-area-rugs-brown-cheetah-leopard-5x8-rugs-for-living-room-5x7-clearance.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 296,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{item}} that {{attribute}} the picture.",
|
|
"intent": "Find me powder to make the beverage that is the same as the picture.",
|
|
"image": "https://images.pexels.com/photos/5947093/pexels-photo-5947093.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "powder to make the beverage",
|
|
"attribute": "is the same as"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "document.querySelector('.page-title').textContent.toLocaleLowerCase()",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"matcha |OR| green tea"
|
|
]
|
|
}
|
|
}
|
|
],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": ""
|
|
},
|
|
"intent_template_id": 98,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/ryu-mei-japanese-organic-matcha-green-tea-powder-super-food-with-high-level-of-antioxidant-catechin-kyoto-g4-100-2-packs.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 297,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{item}} that {{attribute}} the picture.",
|
|
"intent": "Find me a hoodie that has the same brand as the one the man is wearing in the picture.",
|
|
"image": "https://images.pexels.com/photos/1989242/pexels-photo-1989242.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "a hoodie",
|
|
"attribute": "has the same brand as the one the man is wearing in"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html",
|
|
"page_image_query"
|
|
],
|
|
"page_image_query": [
|
|
{
|
|
"eval_image_url": "last",
|
|
"eval_image_class": ".fotorama__stage__frame",
|
|
"eval_vqa": [
|
|
{
|
|
"question": "Is this a hoodie? (yes/no)",
|
|
"answer": "yes"
|
|
}
|
|
]
|
|
}
|
|
],
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "document.querySelector('.page-title').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Champion"
|
|
]
|
|
}
|
|
}
|
|
],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": ""
|
|
},
|
|
"intent_template_id": 98,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/ryu-mei-japanese-organic-matcha-green-tea-powder-super-food-with-high-level-of-antioxidant-catechin-kyoto-g4-100-2-packs.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 298,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=champion+hoodie",
|
|
"geolocation": null,
|
|
"intent_template": "What size of {{item}} should I buy if {{condition}}?",
|
|
"intent": "What size of the dark green hoodie in this page should I buy if my chest size is 120 cm?",
|
|
"instantiation_dict": {
|
|
"item": "the dark green hoodie in this page",
|
|
"condition": "my chest size is 120 cm"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"XL |OR| X-Large"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "This task requires OCR.",
|
|
"reference_answer_raw_annotation": "XL"
|
|
},
|
|
"intent_template_id": 99,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/champion-men-s-sideline-quarter-zip-pullover-with-woven.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 299,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=under+armor",
|
|
"geolocation": null,
|
|
"intent_template": "What size of {{item}} should I buy if {{condition}}?",
|
|
"intent": "What size of the zip hoodie in this page should I buy if my waist size is 30 inches?",
|
|
"instantiation_dict": {
|
|
"item": "the zip hoodie in this page",
|
|
"condition": "my waist size is 30 inches"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"S |OR| Small"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "This task requires OCR.",
|
|
"reference_answer_raw_annotation": "S"
|
|
},
|
|
"intent_template_id": 99,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/under-armor-men-s-sc30-ua-threadborne-full-zip-hoodie.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 300,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/baseball-hoodie-for-boys-teens-men-word-cloud-silhouette.html",
|
|
"geolocation": null,
|
|
"intent_template": "What size of {{item}} should I buy if {{condition}}?",
|
|
"intent": "What size of this item should I buy if my shirt width is 28 and 1/4 inches?",
|
|
"instantiation_dict": {
|
|
"item": "this item",
|
|
"condition": "my shirt width is 28 and 1/4 inches"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"XX-Large |OR| XXLarge |OR| 2X-L |OR| 2XL"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "This task requires OCR.",
|
|
"reference_answer_raw_annotation": "XX-Large"
|
|
},
|
|
"intent_template_id": 99,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/baseball-hoodie-for-boys-teens-men-word-cloud-silhouette.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 301,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/jaybee-s-nuts-and-dried-fruits-sweet-dried-pineapple-rings-15-oz-tasty-tropical-dry-fruit-slices-on-the-go-snack-resealable-bag-kosher.html",
|
|
"geolocation": null,
|
|
"intent_template": "How many calories are in {{item}}?",
|
|
"intent": "How many calories are in this item per serving?",
|
|
"instantiation_dict": {
|
|
"item": "this item per serving"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"70"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "This task requires OCR.",
|
|
"reference_answer_raw_annotation": "70"
|
|
},
|
|
"intent_template_id": 100,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/jaybee-s-nuts-and-dried-fruits-sweet-dried-pineapple-rings-15-oz-tasty-tropical-dry-fruit-slices-on-the-go-snack-resealable-bag-kosher.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 302,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/q-drinks-ginger-beer-25-4-ounce-12-bottles.html",
|
|
"geolocation": null,
|
|
"intent_template": "How many calories are in {{item}}?",
|
|
"intent": "How many calories are in this item per container?",
|
|
"instantiation_dict": {
|
|
"item": "this item per container"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"280"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "This task requires OCR.",
|
|
"reference_answer_raw_annotation": "280"
|
|
},
|
|
"intent_template_id": 100,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/q-drinks-ginger-beer-25-4-ounce-12-bottles.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 303,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/tea-zone-2-lb-strawberry-powder.html",
|
|
"geolocation": null,
|
|
"intent_template": "How many calories are in {{item}}?",
|
|
"intent": "How many calories are in this item per container?",
|
|
"instantiation_dict": {
|
|
"item": "this item per container"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"4200"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "4200"
|
|
},
|
|
"intent_template_id": 100,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/tea-zone-2-lb-strawberry-powder.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 304,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/top-dry-garlic-shrimp-fries-25g-best-taiwanese-gift-top-dry-fresh-stock-taiwan-food-snack.html",
|
|
"geolocation": null,
|
|
"intent_template": "How many calories are in {{item}}?",
|
|
"intent": "How many calories are in this item per serving?",
|
|
"instantiation_dict": {
|
|
"item": "this item per serving"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"117.6 |OR| 117 |OR| 118"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "This task requires OCR and translation.",
|
|
"reference_answer_raw_annotation": "117.6"
|
|
},
|
|
"intent_template_id": 100,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/top-dry-garlic-shrimp-fries-25g-best-taiwanese-gift-top-dry-fresh-stock-taiwan-food-snack.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 305,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?p=6&q=pineapple",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{item}} that {{attribute}} the picture.",
|
|
"intent": "Find me the item in this page that has similar packaging boxes to the ones in the picture.",
|
|
"image": "https://images.pexels.com/photos/7620774/pexels-photo-7620774.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "the item in this page",
|
|
"attribute": "has similar packaging boxes to the ones in"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/sunny-hills-pineapple-cake-10pcs-500g-best-taiwanese-gift-sunny-hills-fresh-stock-taiwan-food-pineapple-cake.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 98,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/sunny-hills-pineapple-cake-10pcs-500g-best-taiwanese-gift-sunny-hills-fresh-stock-taiwan-food-pineapple-cake.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 306,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?q=cookie",
|
|
"geolocation": null,
|
|
"intent_template": "Show me the product page of the {{item}}.",
|
|
"intent": "Show me the product page of the 10 oz net weight cookie.",
|
|
"instantiation_dict": {
|
|
"item": "10 oz net weight cookie"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/trader-joe-s-cookie-butter-sandwich-cookies.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 101,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 307,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?p=6&q=ice+cream",
|
|
"geolocation": null,
|
|
"intent_template": "Show me the product page of the {{item}}.",
|
|
"intent": "Show me the product page of the 1.6 oz net weight ice cream.",
|
|
"instantiation_dict": {
|
|
"item": "1.6 oz net weight ice cream"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/joy-mini-cups-miniature-ice-cream-cones-for-kids-desserts-cupcake-cones-cake-pops-42-count-1-box-42-cones.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 101,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 308,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?q=pretzel",
|
|
"geolocation": null,
|
|
"intent_template": "Show me the product page of the {{item}}.",
|
|
"intent": "Show me the product page of the pretzels which says 1.8 pounds net weight on its packaging.",
|
|
"instantiation_dict": {
|
|
"item": "pretzels which says 1.8 pounds net weight on its packaging"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/lalees-blueberry-yogurt-pretzels-approx-1-3-pounds-yogurt-covered-pretzels-gourmet-pretzels.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 101,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 309,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"viewport_size": {
|
|
"width": 430,
|
|
"height": 932
|
|
},
|
|
"intent_template": "Please show me the product page for the item in the {{row}} row, {{column}} column.",
|
|
"intent": "Please show me the product page for the item in the third row, first column.",
|
|
"instantiation_dict": {
|
|
"row": "third",
|
|
"column": "first"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/so-delicious-dairy-free-cocowhip-light-vegan-non-gmo-project-verified-9-oz-tub.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 102,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 310,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/health-household.html",
|
|
"geolocation": null,
|
|
"viewport_size": {
|
|
"width": 844,
|
|
"height": 393
|
|
},
|
|
"intent_template": "Please show me the product page for the item in the {{row}} row, {{column}} column.",
|
|
"intent": "Please show me the product page for the item in the second row, first column.",
|
|
"instantiation_dict": {
|
|
"row": "second",
|
|
"column": "first"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/lr1130-ag10-battery-1-5v-long-lasting-alkaline-button-cell-batteries-20-batteries-5-year-warranty.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 102,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 311,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"viewport_size": {
|
|
"width": 896,
|
|
"height": 414
|
|
},
|
|
"intent_template": "Tell me the price of the {{product}} in the {{location}}.",
|
|
"intent": "Tell me the price of the item in the fourth row, second column.",
|
|
"instantiation_dict": {
|
|
"product": "item",
|
|
"location": "fourth row, second column"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"string_note": "There is no fourth row.",
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 18,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 312,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"viewport_size": {
|
|
"width": 1280
|
|
},
|
|
"intent_template": "Please show me the product page for the item in the {{row}} row, {{column}} column.",
|
|
"intent": "Please show me the product page for the item in the second row, second column.",
|
|
"instantiation_dict": {
|
|
"row": "second",
|
|
"column": "second"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/q-mixers-premium-ginger-ale-real-ingredients-less-sweet-6-7-fl-oz-24-bottles.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 102,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 313,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen.html",
|
|
"geolocation": null,
|
|
"viewport_size": {
|
|
"width": 430,
|
|
"height": 932
|
|
},
|
|
"intent_template": "Please add the item in the {{row}} row, {{column}} column to the shopping cart.",
|
|
"intent": "Please add the item in the third row, second column to the shopping cart.",
|
|
"instantiation_dict": {
|
|
"row": "third",
|
|
"column": "second"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Wood Storage Bench Homes Collection w/2 Drawers, Wicker Storage Bench Entryway Bench with Removable Basket & Cushion, Fully Assembled Shoe Bench for Hallway Entryway Living Room (Espresso)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 103,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 314,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=adapter",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{item}}.",
|
|
"intent": "Find me an adapter to connect these devices from the two images from this page.",
|
|
"image": [
|
|
"https://images.pexels.com/photos/914915/pexels-photo-914915.jpeg",
|
|
"https://images.pexels.com/photos/2047905/pexels-photo-2047905.jpeg"
|
|
],
|
|
"instantiation_dict": {
|
|
"item": "an adapter to connect these devices from the two images from this page"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/adapters-for-macbook-pro-usb-hdmi-adapter-multiport-usb-c-hub-macbook-pro-adapter-dongle-7-in-2-macbook-pro-usb-c-docking-station-dual-monitor-hdmi-adapter-with-dual-hdmi-2-usb-3-0-tf-sd-usb-c-100w.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 104,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 315,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=usb+c",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{item}}.",
|
|
"intent": "Find me an adapter to connect these devices from the two images from this page.",
|
|
"image": [
|
|
"https://images.pexels.com/photos/1738642/pexels-photo-1738642.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"https://images.pexels.com/photos/434346/pexels-photo-434346.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1"
|
|
],
|
|
"instantiation_dict": {
|
|
"item": "an adapter to connect these devices from the two images from this page"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/usb-c-hub-hdmi-adapter-for-macbook-pro-multi-ports-mac-dongle-with-4k-usb-c-to-hdmi-7-in-1-usb-c-hub-usb-c-to-hdmi-sd-tf-card-reader-3-usb-3-0-and-usb-c-power-pass-through-port-adapters.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 104,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 316,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=coke",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me the price of the {{product}}.",
|
|
"intent": "Tell me the price of the 30 oz coke.",
|
|
"instantiation_dict": {
|
|
"product": "30 oz coke"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"string_note": "There is no 30oz coke.",
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 19,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 317,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=beer",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me the price of the {{product}}.",
|
|
"intent": "Tell me the price of the 18 oz beer.",
|
|
"instantiation_dict": {
|
|
"product": "18 oz beer"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"string_note": "There is no 18oz beer.",
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 19,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 318,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=USB+C+HUB%2C+7+in+1",
|
|
"geolocation": null,
|
|
"intent_template": "Please add to my shopping cart all the items from this page that can connect these devices from the two images.",
|
|
"intent": "Please add to my shopping cart all the items from this page that can connect these devices from the two images.",
|
|
"image": [
|
|
"https://images.pexels.com/photos/2148216/pexels-photo-2148216.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"https://images.pexels.com/photos/415043/pexels-photo-415043.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1"
|
|
],
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"USB C Hub Ethernet, 7 in 1 Type C Hub Multiport Adapter Desk Mount USB Docking Station, with 3 USB3.0, USB2.0, 1Gbps Ethern and SD/TF Card Reader, Clamp Design for iMac, Desktop, Computer, Table Edge",
|
|
"USB Docking Station Giq USB C hub USB 3.0 to Dual HDMI VGA Adapter Triple Display USB C Laptop Docking Station Dual Display Compatible with MacBook M1 USB Dock"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 105,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping",
|
|
"wikipedia"
|
|
],
|
|
"task_id": 319,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=type+c+to+3.5",
|
|
"geolocation": null,
|
|
"intent_template": "Please add to my shopping cart all the items from this page that can connect these devices from the two images.",
|
|
"intent": "Please add to my shopping cart all the items from this page that can connect these devices from the two images.",
|
|
"image": [
|
|
"__WIKIPEDIA__/wikipedia_en_all_maxi_2022-05/I/Galaxy_Z_Flip.jpg.webp",
|
|
"__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B06XWXR6M9.0.jpg"
|
|
],
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"USB Type C to 3.5mm Headphone and Charger Adapter, 2-in-1 USB C to 3.5 mm Audio Jack PD Fast Charging Aux Cable Compatible with Samsung Galaxy S21 S20+ S20 Fe S10 Note 20 Ultra 10 Plus, Pixel 3 4 XL"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 105,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 320,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breads-bakery/cookies.html",
|
|
"geolocation": null,
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07CM3LVT2.0.jpg",
|
|
"intent_template": "Add {{quantity}} of {{item}} from this page to my shopping cart.",
|
|
"intent": "Add enough to have 48 bars of the item that most looks like the image from this page to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"quantity": "enough to have 48 bars",
|
|
"item": "the item that most looks like the image"
|
|
},
|
|
"require_reset": true,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart/",
|
|
"locator": "lambda:(() => {try {return Array.from(document.querySelectorAll('.item-info')).find(el => el.textContent.includes('Protein Wafer Peanut Butter - Box of 12 Bars, Peanut Butter, 12 Count')).querySelector('input').getAttribute('data-item-qty')} catch (e) {return ' '}})()",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"4"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 96,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/protein-wafer-peanut-butter-box-of-12-bars-peanut-butter-12-count.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 321,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breads-bakery/cookies.html",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/6734161/pexels-photo-6734161.jpeg",
|
|
"intent_template": "Add {{quantity}} of {{item}} from this page to my shopping cart.",
|
|
"intent": "Add enough to have 400 of the cookies that most looks like the image from this page to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"quantity": "enough to have 400",
|
|
"item": "the cookies that most looks like the image"
|
|
},
|
|
"require_reset": true,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart/",
|
|
"locator": "lambda:(() => {try {return Array.from(document.querySelectorAll(\".item-info\")).find(el => el.textContent.includes(\"Annie's Organic 20 Piece Grabbits Chocolate Mint Sandwich Cookies, 8.06 Ounce (Pack of 10)\")).querySelector(\"input\").getAttribute(\"data-item-qty\")} catch (e) {return \" \"}})()",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"2"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 96,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/annie-s-organic-20-piece-grabbits-chocolate-mint-sandwich-cookies-8-06-ounce-pack-of-10.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 322,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=vacuum",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/6617538/pexels-photo-6617538.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"intent_template": "I want to buy this specific item, but only if it's brand new. Can you add one from this page to my cart?",
|
|
"intent": "I want to buy this specific item, but only if it's brand new. Can you add one from this page to my cart?",
|
|
"instantiation_dict": {},
|
|
"require_reset": true,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "The vaccum cleaner is not brand new",
|
|
"reference_answer_raw_annotation": "The vaccum cleaner is not brand new"
|
|
},
|
|
"intent_template_id": 106,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 323,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?p=2&q=switch",
|
|
"geolocation": null,
|
|
"intent_template": "Tell me the price of the {{product}}.",
|
|
"intent": "Tell me the price of the purple drink on this page.",
|
|
"instantiation_dict": {
|
|
"product": "purple drink on this page"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"string_note": "There is no purple drink on the page.",
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 19,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 324,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?q=screen+protector",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/12741170/pexels-photo-12741170.jpeg",
|
|
"intent_template": "Tell me the price of the {{product}}.",
|
|
"intent": "Tell me the price of the items on this page that are compatible with this phone brand.",
|
|
"instantiation_dict": {
|
|
"product": "items on this page that are compatible with this phone brand"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"9.99",
|
|
"8.49"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": []
|
|
},
|
|
"intent_template_id": 19,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": "__SHOPPING__/fotbor-for-iphone-xr-iphone-11-screen-protector-privacy-tempered-glass-film-2-pack-iphone-11-privacy-screen-protector-iphone-xr-privacy-screen-protector-anti-spy-easy-install-case-friendly-6-1-inch.html and __SHOPPING__/mkeke-compatible-with-iphone-11-pro-max-screen-protector-iphone-xs-max-screen-protector-tempered-glass-3-pack-6-5.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 325,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/5082559/pexels-photo-5082559.jpeg",
|
|
"intent_template": "Purchase the cheapest {{item}}, in {{color}}.",
|
|
"intent": "Purchase the cheapest item that closely resembles the item on the right in the image, in blue.",
|
|
"instantiation_dict": {
|
|
"item": "item that closely resembles the item on the right in the image",
|
|
"color": "blue"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09443ZWQD",
|
|
"Blue"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 107,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/wireless-mouse-3-adjustable-dpi-innovative-stylish-portable-gaming-mouse-suitable-for-notebook-pc-computer-office-home-work.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 326,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/18966448/pexels-photo-18966448.jpeg",
|
|
"intent_template": "Purchase the cheapest {{item}}, in {{color}}.",
|
|
"intent": "Purchase the cheapest headphones that has the same brand as the one in the image, in blue.",
|
|
"instantiation_dict": {
|
|
"item": "headphones that has the same brand as the one in the image",
|
|
"color": "blue"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B08KKW2ZS2",
|
|
"Mint"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 107,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/logitech-g335-wired-gaming-headset-with-flip-to-mute-microphone-3-5mm-audio-jack-memory-foam-earpads-lightweight-compatible-with-pc-playstation-xbox-nintendo-switch-mint.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 327,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/8534088/pexels-photo-8534088.jpeg",
|
|
"intent_template": "Purchase the cheapest {{item}}, in {{color}}.",
|
|
"intent": "Purchase the cheapest item that has the same functionality as this, in black.",
|
|
"instantiation_dict": {
|
|
"item": "item that has the same functionality as this",
|
|
"color": "black"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09RB14X4D",
|
|
"Black"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 107,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/wireless-earbuds-mics-call-noise-canceling-wireless-charging-case-bluetooth-5-0-headset-wireless-earphones-mini-earbuds-stereo-headphones-white.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 328,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07X9SC7PW.0.jpg",
|
|
"intent_template": "Buy {{item}} while minimizing costs.",
|
|
"intent": "Buy eight batteries of the same type as shown in the image while minimizing costs.",
|
|
"instantiation_dict": {
|
|
"item": "eight batteries of the same type as shown in the image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B001B826IY",
|
|
"2.40"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 108,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/gp-batteries-30310-battery-alkaline-aaa.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 329,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/1433191/pexels-photo-1433191.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"intent_template": "Buy {{item}} while minimizing costs.",
|
|
"intent": "Buy 40 sheet of films as shown in the image while minimizing costs.",
|
|
"instantiation_dict": {
|
|
"item": "40 sheet of films as shown in the image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B073W8MFP9",
|
|
"25.98"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 108,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/fujifilm-instax-mini-photo-camera-film-pack.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 330,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/2634435/pexels-photo-2634435.jpeg",
|
|
"intent_template": "Buy {{item}} {{condition}}.",
|
|
"intent": "Buy the cheapest camera of the exact same model as the image, in the same color.",
|
|
"instantiation_dict": {
|
|
"item": "the cheapest camera of the exact same model as the image,",
|
|
"condition": "in the same color"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07429BS32",
|
|
"Ice Blue"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 109,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/fujifilm-instax-mini-9-instant-camera-cobalt-blue-with-2-x-instant-twin-film-pack-40-exposures.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 331,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/3292366/pexels-photo-3292366.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"intent_template": "Purchase the exact item shown in the image.",
|
|
"intent": "Purchase the exact item shown in the image.",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Sony",
|
|
"Alpha A7 II"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 110,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/sony-alpha-a7-ii-digital-camera-body-with-sonnar-t-fe-55mm-f-1-8-za-lens-64gb-card-battery-charger-case-tripod-kit.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 332,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/7789217/pexels-photo-7789217.jpeg",
|
|
"intent_template": "Purchase the exact item shown in the image.",
|
|
"intent": "Purchase the exact item shown in the image.",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Canon",
|
|
"EOS R6"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 110,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "__SHOPPING__/canon-eos-r6-mirrorless-digital-camera-body-bundle-128gb-memory-case-tripod-18pc-bundle.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 333,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/2378138/pexels-photo-2378138.jpeg",
|
|
"intent_template": "Purchase the exact item shown in the image.",
|
|
"intent": "Purchase the exact item shown in the image.",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"string_note": "This item does not exist on OneStopMarket.",
|
|
"reference_url": "",
|
|
"program_html": []
|
|
},
|
|
"intent_template_id": 110,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 334,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/18943585/pexels-photo-18943585.jpeg",
|
|
"intent_template": "Purchase the exact item shown in the image.",
|
|
"intent": "Purchase the exact item shown in the image.",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"string_note": "This item does not exist on OneStopMarket.",
|
|
"reference_url": "",
|
|
"program_html": []
|
|
},
|
|
"intent_template_id": 110,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 335,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/6347514/pexels-photo-6347514.jpeg",
|
|
"intent_template": "Buy me {{item}} to {{address}}.",
|
|
"intent": "Buy me a chocolate ice cream to the address same as the label shown in the image. My phone number is also (650) 555-0111 in case it is needed.",
|
|
"instantiation_dict": {
|
|
"item": "a chocolate ice cream",
|
|
"address": "the address same as the label shown in the image. My phone number is also (650) 555-0111 in case it is needed"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"chocolate",
|
|
"ice cream"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".box-order-shipping-address\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"123 Bloome Street",
|
|
"Manhattan, New York, 12112"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 111,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": "This task requires OCR."
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 336,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/6347909/pexels-photo-6347909.jpeg",
|
|
"intent_template": "Buy me {{item}} to {{address}}.",
|
|
"intent": "Buy me the cheapest color photo printer (from the \"Printers & Accessories\") category to Emily's place as shown in the image. My phone number is also (650) 555-0111 in case it is needed..",
|
|
"instantiation_dict": {
|
|
"item": "the cheapest color photo printer (from the \"Printers & Accessories\") category",
|
|
"address": "Emily's place as shown in the image. My phone number is also (650) 555-0111 in case it is needed."
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B005TI2Q6O"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".box-order-shipping-address\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"55 W89",
|
|
"Littletown",
|
|
"Manhattan, New York, 12345"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 111,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "This task requires OCR."
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 337,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/6348050/pexels-photo-6348050.jpeg",
|
|
"intent_template": "Buy me {{item}} to {{address}}.",
|
|
"intent": "Buy me the cheapest bike to Mars's place as shown in the image. My phone number is also (650) 555-0111 in case it is needed..",
|
|
"instantiation_dict": {
|
|
"item": "the cheapest bike",
|
|
"address": "Mars's place as shown in the image. My phone number is also (650) 555-0111 in case it is needed."
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"string_note": "OneStopMarket has no bikes.",
|
|
"reference_url": "",
|
|
"program_html": []
|
|
},
|
|
"intent_template_id": 111,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "OneStopMarket has no bikes."
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 338,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/129112/pexels-photo-129112.jpeg",
|
|
"intent_template": "Change my default shipping address to the place shown in the image.",
|
|
"intent": "Change my default shipping address to the place shown in the image.",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/customer/address/",
|
|
"locator": "document.querySelector(\".box-address-shipping\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"1600 Pennsylvania Ave",
|
|
"Washington, District of Columbia, 20500",
|
|
"United States"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 112,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": "It's an image of the White House."
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 339,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/19047616/pexels-photo-19047616.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"intent_template": "Change my default shipping address to the place shown in the image.",
|
|
"intent": "Change my default shipping address to the place shown in the image.",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/customer/address/",
|
|
"locator": "document.querySelector(\".box-address-shipping\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"1 Kinkakuji",
|
|
"Kyoto",
|
|
"Japan"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 112,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": "It's an image of the Kinkaku-ji. Actual address is sometimes in Japanese, so address eval only checks for the first part."
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 340,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/2071882/pexels-photo-2071882.jpeg",
|
|
"intent_template": "Change my default shipping address to the place shown in the image.",
|
|
"intent": "Change my default shipping address to the place shown in the image.",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"string_note": "This image does not have a shipping address.",
|
|
"reference_url": "",
|
|
"program_html": []
|
|
},
|
|
"intent_template_id": 112,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 341,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/11559638/pexels-photo-11559638.jpeg",
|
|
"intent_template": "Buy {{item}} {{condition}}.",
|
|
"intent": "Buy a CPU which is compatible with the motherboard in the image.",
|
|
"instantiation_dict": {
|
|
"item": "a CPU",
|
|
"condition": "which is compatible with the motherboard in the image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B08X6NXNX7",
|
|
"323.99"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".item-options\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Processor 8 Cores"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 109,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/intelr-coretm-i7-11700kf-desktop-processor-8-cores-up-to-5-0-ghz-unlocked-lga1200-intelr-500-series-select-400-series-chipset-125w.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 342,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/18338406/pexels-photo-18338406.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"intent_template": "Buy {{item}} {{condition}}.",
|
|
"intent": "Buy a motherboard which has the same CPU socket as the motherboard in the image.",
|
|
"instantiation_dict": {
|
|
"item": "a motherboard",
|
|
"condition": "which has the same CPU socket as the motherboard in the image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09J1S2LDS",
|
|
"294.99"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 109,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/asus-tuf-gaming-z690-plus-wifi-d4-lga1700-intel-12th-gen-atx-gaming-motherboard-pcie-5-0-ddr4-4xm-2-nvme-ssd-14-2-power-stages-wifi-6-2-5gb-lan-front-usb-3-2-gen-2-type-c-thunderbolt-4-argb-headers.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 343,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/3665444/pexels-photo-3665444.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"intent_template": "Buy {{item}} {{condition}}.",
|
|
"intent": "Buy a desktop computer which has a CPU of the same brand as the CPU in the image.",
|
|
"instantiation_dict": {
|
|
"item": "a desktop computer",
|
|
"condition": "which has a CPU of the same brand as the CPU in the image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"AMD",
|
|
"Desktop |OR| PC"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 109,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 344,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/4705617/pexels-photo-4705617.jpeg",
|
|
"intent_template": "Buy {{item}} {{condition}}.",
|
|
"intent": "Buy the cheapest battery which is the same type as the boy is holding in the image.",
|
|
"instantiation_dict": {
|
|
"item": "the cheapest battery",
|
|
"condition": "which is the same type as the boy is holding in the image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B002M6WY72",
|
|
"8.59"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 109,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "__SHOPPING__/petsafe-9-volt-replacement-alkaline-battery-compatible-with-petsafe-9v-battery-operated-products-pac11-12067.html"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping",
|
|
"wikipedia"
|
|
],
|
|
"task_id": 345,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__ |AND| __WIKIPEDIA__/wikipedia_en_all_maxi_2022-05/I/Country_calling_codes_map.svg.png.webp",
|
|
"geolocation": null,
|
|
"image": null,
|
|
"intent_template": "Prepend the country code of {{country}} to the phone number of my account profile.",
|
|
"intent": "Prepend the country code of South Korea to the phone number of my account profile.",
|
|
"instantiation_dict": {
|
|
"country": "South Korea"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/customer/address/",
|
|
"locator": "document.querySelector(\".box-address-billing > div.box-content > address > a\").outerText.substring(0, 3)",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"82 |OR| +82"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 113,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 346,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/777059/pexels-photo-777059.jpeg",
|
|
"intent_template": "Prepend the country code of {{country}} to the phone number of my account profile.",
|
|
"intent": "Prepend the country code of the country shown in the image to the phone number of my account profile.",
|
|
"instantiation_dict": {
|
|
"country": "the country shown in the image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/customer/address/",
|
|
"locator": "document.querySelector(\".box-address-billing > div.box-content > address > a\").outerText.substring(0, 3)",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"65 |OR| +65"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 113,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": "Singapore +65"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 347,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/5967048/pexels-photo-5967048.jpeg",
|
|
"intent_template": "Prepend the country code of {{country}} to the phone number of my account profile.",
|
|
"intent": "Prepend the country code of the country of the map show in the image to the phone number of my account profile.",
|
|
"instantiation_dict": {
|
|
"country": "the country of the map show in the image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/customer/address/",
|
|
"locator": "document.querySelector(\".box-address-billing > div.box-content > address > a\").outerText.substring(0, 2)",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"7 |OR| +7"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 113,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "Russia +7"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 348,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?q=travel+adapter",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/16075421/pexels-photo-16075421.jpeg",
|
|
"intent_template": "Empty my cart first and add all the items (in any color) from this page to my shopping cart which {{condition}}.",
|
|
"intent": "Empty my cart first and add all the items (in any color) from this page to my shopping cart which is compatible with the socket in the image.",
|
|
"instantiation_dict": {
|
|
"condition": "is compatible with the socket in the image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Key Power 230-Watt Step Down 220V to 110V Voltage Converter & International Travel Adapter",
|
|
"USB Charger, Charging Block CIQILY 5-Pack 1A/5V USB Power Home Travel Adapter Wall Charger Cube Brick Box Base Head Compatible for Phone X 8 7 6 Plus 5S, iPad, Samsung, LG, Moto,Tablet, Android Phone",
|
|
"OEM HTC USB Travel Charger Adapter U250 / CNR6300 / 79H00095-14M",
|
|
"Universal Power Supply Notebook Laptop Charger 120 W car Home Laptop Adapter Plug for car/Home/Travel with overheating/Overload/Short Circuit Protection US Plug",
|
|
"SCOOFEX Universal Travel Adapter, International Power Electric Outlet Converters with USB Ports - Wall Charger AC Plug Type C Type A Type G Type I for US/EU/UK/AU/Asia/China/Japan 150+Countries",
|
|
"130.73 |OR| 118.74"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 114,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "MacBook Charger Case Cover is ambiguous: it's actually a case, which is why we consider both 130.73 or 118.74 to be correct."
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 349,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?q=travel+adapter",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/6987724/pexels-photo-6987724.jpeg",
|
|
"intent_template": "Empty my cart first and add all the items (in any color) from this page to my shopping cart which {{condition}}.",
|
|
"intent": "Empty my cart first and add all the items (in any color) from this page to my shopping cart which is compatible with the socket in the image.",
|
|
"instantiation_dict": {
|
|
"condition": "is compatible with the socket in the image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Key Power 230-Watt Step Down 220V to 110V Voltage Converter & International Travel Adapter/Power Converter with Type C Port 18W - [Use for USA Appliance Overseas in Europe, AU, UK, Ireland, etc.]",
|
|
"Europe Travel Adapter, Ceptics Ultra Compact Dual USB Power Plug - for European Type C - 3 Inputs - iPhone, Laptop, Galaxy, Cell Phones, Camera Chargers, iWatch & More - CTU-9C",
|
|
"SCOOFEX Universal Travel Adapter, International Power Electric Outlet Converters with USB Ports - Wall Charger AC Plug Type C Type A Type G Type I for US/EU/UK/AU/Asia/China/Japan 150+Countries",
|
|
"74.15"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 114,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 350,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=+screwdriver#",
|
|
"geolocation": null,
|
|
"image": "https://images.pexels.com/photos/6208704/pexels-photo-6208704.jpeg",
|
|
"intent_template": "Buy {{item}} {{condition}}.",
|
|
"intent": "Buy a screwdriver which is compatible with the screw in the image from this page.",
|
|
"instantiation_dict": {
|
|
"item": "a screwdriver",
|
|
"condition": "which is compatible with the screw in the image from this page"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B0968D6PC1"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 109,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 351,
|
|
"require_login": false,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=+screwdriver#",
|
|
"geolocation": null,
|
|
"image": "__WIKIPEDIA__/wikipedia_en_all_maxi_2022-05/I/LR44_Button_Cell_Battery_IEC_Standard_Version.jpg.webp",
|
|
"intent_template": "Buy {{item}} {{condition}}.",
|
|
"intent": "Buy a battery with the same size and voltage as the image.",
|
|
"instantiation_dict": {
|
|
"item": "a battery",
|
|
"condition": "with the same size and voltage as the image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"LR44"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 109,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 352,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/?q=iphone+to+3.5",
|
|
"geolocation": null,
|
|
"intent_template": "Please add to my shopping cart all the items from this page that can connect these devices from the two images.",
|
|
"intent": "Please add to my shopping cart all the items from this page that can connect these devices from the two images.",
|
|
"image": [
|
|
"https://images.pexels.com/photos/14666017/pexels-photo-14666017.jpeg",
|
|
"__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B06XWXR6M9.0.jpg"
|
|
],
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"[Apple MFi Certified] Headphone Adapter for iPhone, Belcompany 2 Pack Lightning to 3.5mm AUX Earphone Audio Stereo Converter Compatible with iPhone 13/12/11/XS/XR/X/iPad, Support Call & Music Control"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 105,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 353,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry.html?p=12",
|
|
"geolocation": null,
|
|
"intent_template": "I really like these {{product}}, but I am not satisfied with the color. Could you find me an item on this page for these {{product}} with a {{shadeChoice}} shade or color?",
|
|
"intent": "I really like these shoes, but I am not satisfied with the color. Could you find me an item on this page for these shoes with a darker shade or color?",
|
|
"image": "https://images.pexels.com/photos/3636684/pexels-photo-3636684.jpeg",
|
|
"instantiation_dict": {
|
|
"product": "shoes",
|
|
"shadeChoice": "darker"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/vans-old-skool-black-white-skate-vn-0d3hy28-mens-us-9-5-uk-8-5-eur-42-5.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 115,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 354,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that are of the same brand as the product in this picture. It needs to {{description}}.",
|
|
"intent": "Find me shoes that are of the same brand as the product in this picture. It needs to be less than 70 dollars.",
|
|
"image": "https://images.pexels.com/photos/14544746/pexels-photo-14544746.jpeg",
|
|
"instantiation_dict": {
|
|
"category": "shoes",
|
|
"description": "be less than 70 dollars"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "lambda:(() => { res = parseFloat(document.querySelector(\"#maincontent > div.columns > div > div.product-info-main > div.product-info-price > div.price-box.price-final_price > span > span\").outerText.substr(1)); return res ? res : 0; })()",
|
|
"required_contents": {
|
|
"required_values": [
|
|
"< 70"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "lambda:(() => { try { return document.querySelector('#maincontent > div.page-title-wrapper.product > h1 > span').textContent } catch (e) { return '' }})()",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Croc"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 116,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 355,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/exercise-fitness.html?p=6",
|
|
"geolocation": null,
|
|
"intent_template": "I am a fan of {{organization}}. Can you find an image address of a {{product}} with their logo that I can wear to support them?",
|
|
"intent": "I am a fan of the Minnesota Vikings. Can you find an image address of a shirt with their logo that I can wear to support them?",
|
|
"instantiation_dict": {
|
|
"organization": "the Minnesota Vikings",
|
|
"product": "shirt"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B07BCKK3HS.0.jpg |OR| B07BCKK3HS.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07BCKK3HS.0.jpg"
|
|
},
|
|
"intent_template_id": 117,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 356,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/men/clothing.html?p=16",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{category}} that is of the same brand as the product in this image. It needs to {{description}}.",
|
|
"intent": "Find me a hoodie that is of the same brand as the product in this image. It needs to have the brand logo in multicolor.",
|
|
"image": "https://images.pexels.com/photos/3819969/pexels-photo-3819969.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=2",
|
|
"instantiation_dict": {
|
|
"category": "a hoodie",
|
|
"description": "have the brand logo in multicolor"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"url_match"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "__SHOPPING__/coca-cola-horizon-stripe-logo-men-s-hooded-sweatshirt-white.html",
|
|
"program_html": [],
|
|
"url_note": "EXACT"
|
|
},
|
|
"intent_template_id": 118,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 357,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?p=10&q=socks",
|
|
"geolocation": null,
|
|
"intent_template": "I want {{product}} that are {{colors}}. Can you find an image address of {{target}}?",
|
|
"intent": "I want socks that are green. Can you find an image address of green socks from this page?",
|
|
"instantiation_dict": {
|
|
"product": "socks",
|
|
"colors": "green",
|
|
"target": "green socks from this page"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B07BD2CV35.0.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B07BD2CV35.0.jpg"
|
|
},
|
|
"intent_template_id": 119,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 358,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?p=6&q=korean",
|
|
"geolocation": null,
|
|
"intent_template": "Buy {{product}} with {{detail}} on the packaging.",
|
|
"intent": "Buy snacks with a cute animal on the packaging.",
|
|
"instantiation_dict": {
|
|
"product": "snacks",
|
|
"detail": "a cute animal"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B094C9G7G2"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 120,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 359,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/food-beverage-gifts/snack-gifts.html?p=14",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} with {{detail}} on the packaging (in any size).",
|
|
"intent": "Buy the snacks with horses on the packaging (in any size).",
|
|
"instantiation_dict": {
|
|
"product": "snacks",
|
|
"detail": "horses"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B0095MWPB6"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 121,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 360,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/food-beverage-gifts/snack-gifts.html?p=23",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} with {{detail}} on the packaging (in any size).",
|
|
"intent": "Buy the snacks with a tiger on the packaging (in any size).",
|
|
"instantiation_dict": {
|
|
"product": "snacks",
|
|
"detail": "a tiger"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B08LBRN17G"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 121,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 361,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/snacks-sweets.html?p=8",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} with {{detail}} on the packaging (in any size).",
|
|
"intent": "Buy the snacks with an owl on the packaging (in any size).",
|
|
"instantiation_dict": {
|
|
"product": "snacks",
|
|
"detail": "an owl"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B086RKGJPR"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 121,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 362,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/sport-specific-clothing.html?p=5",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} with {{detail}}.",
|
|
"intent": "Buy the shorts with a graphic print of a clock.",
|
|
"instantiation_dict": {
|
|
"product": "shorts",
|
|
"detail": "a graphic print of a clock"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B093BSCCZ7"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 122,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 363,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/clothing-shoes-jewelry/men/clothing.html?p=13",
|
|
"geolocation": null,
|
|
"intent_template": "Given the image, buy the {{product}} which contain the same object in the image on its design.",
|
|
"intent": "Given the image, buy the shorts which contain the same object in the image on its design.",
|
|
"instantiation_dict": {
|
|
"product": "shorts"
|
|
},
|
|
"image": "https://images.pexels.com/photos/1108099/pexels-photo-1108099.jpeg?auto=compress&cs=tinysrgb&w=800",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09S3QYWJQ"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 123,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 364,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/exercise-fitness.html?p=6",
|
|
"geolocation": null,
|
|
"intent_template": "I am a fan of {{organization}}. Can you find an image address of a {{product}} with their logo that I can wear to support them?",
|
|
"intent": "I am a fan of the Green Bay Packers. Can you find an image address of a shirt with their logo that I can wear to support them?",
|
|
"instantiation_dict": {
|
|
"organization": "the Green Bay Packers",
|
|
"product": "shirt"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There are no Packers shirts available on this page.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 117,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 365,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/home-kitchen.html",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} with {{detail}}.",
|
|
"intent": "Buy the TV with the animal from the image on its display.",
|
|
"instantiation_dict": {
|
|
"product": "TV",
|
|
"detail": "the animal from the image on its display"
|
|
},
|
|
"image": "https://images.pexels.com/photos/17581924/pexels-photo-17581924/free-photo-of-orca-in-zoo.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=2",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B089GT7Z5Z"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 122,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 366,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games.html?p=4",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} with {{detail}}.",
|
|
"intent": "Buy the controller with the cherry blossom design.",
|
|
"instantiation_dict": {
|
|
"product": "controller",
|
|
"detail": "the cherry blossom design"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B08N1FRB5X"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 122,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 367,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/patio-lawn-garden.html",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} with {{detail}} on the packaging (in any size).",
|
|
"intent": "Buy the item with the tomato on the packaging (in any size).",
|
|
"instantiation_dict": {
|
|
"product": "item",
|
|
"detail": "the tomato"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B001B2SNC8"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 121,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 368,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/cell-phones-accessories/cell-phones.html",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} with {{detail}} on the display image (in any color).",
|
|
"intent": "Buy the phone with the skateboarder on the display image (in any color).",
|
|
"instantiation_dict": {
|
|
"product": "phone",
|
|
"detail": "the skateboarder"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B096RX86Y2"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 124,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 369,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} that {{relation}} in the image{{detail}}.",
|
|
"intent": "Buy me a phone (from the \"Cell Phones\" category) that looks the most like the items in the image.",
|
|
"image": "https://images.pexels.com/photos/159644/art-supplies-brushes-rulers-scissors-159644.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=2",
|
|
"instantiation_dict": {
|
|
"product": "phone (from the \"Cell Phones\" category)",
|
|
"relation": "looks the most like the items",
|
|
"detail": ""
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07NSB9ZTZ"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 125,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 370,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} that {{relation}} in the image{{detail}}.",
|
|
"intent": "Buy me a phone (from the \"Cell Phones\" category) that looks the most like the items in the image.",
|
|
"image": "https://images.pexels.com/photos/3954444/pexels-photo-3954444.png?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=2",
|
|
"instantiation_dict": {
|
|
"product": "phone (from the \"Cell Phones\" category)",
|
|
"relation": "looks the most like the items",
|
|
"detail": ""
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07NVKVYZR"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 125,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 371,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Search for \"{{term}}\" and buy me a {{product}} with {{detail}}.",
|
|
"intent": "Search for \"hoodie\" and buy me a hoodie (in any color) with a jack-o-lantern design for less than 10 dollars.",
|
|
"instantiation_dict": {
|
|
"term": "hoodie",
|
|
"product": "hoodie (in any color)",
|
|
"detail": "a jack-o-lantern design for less than 10 dollars"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09G2YFQHF"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 126,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 372,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} that {{relation}} in the image{{detail}}.",
|
|
"intent": "Buy me a charging cable (from the \"Chargers & Power Adapters\" category) in any color that looks the most like the items in the image.",
|
|
"image": "https://images.pexels.com/photos/10593653/pexels-photo-10593653.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=2",
|
|
"instantiation_dict": {
|
|
"product": "charging cable (from the \"Chargers & Power Adapters\" category) in any color",
|
|
"relation": "looks the most like the items",
|
|
"detail": ""
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B081WY776W"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 125,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 373,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "What is the color of the {{type}} item in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"type": "cheapest car charger",
|
|
"product_category": "Chargers & Power Adapters"
|
|
},
|
|
"intent": "What is the color of the cheapest car charger item in the \"Chargers & Power Adapters\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"black"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "black"
|
|
},
|
|
"intent_template_id": 6,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 374,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} with {{detail}}.",
|
|
"intent": "Buy me a phone case (from the \"Basic Cases\" category) with a Barbie theme between 12-14 dollars.",
|
|
"instantiation_dict": {
|
|
"product": "phone case (from the \"Basic Cases\" category)",
|
|
"detail": "a Barbie theme between 12-14 dollars"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09NJKPD3N"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 127,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 375,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} with {{detail}}.",
|
|
"intent": "Buy me a pink phone case for my iPhone 11 6.1\" with a Stitch graphic from the \"Basic Cases\" category.",
|
|
"instantiation_dict": {
|
|
"product": "pink phone case for my iPhone 11 6.1\"",
|
|
"detail": "a Stitch graphic from the \"Basic Cases\" category"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07Q17MK1F",
|
|
"iPhone 11 6.1"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 127,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 376,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} with {{detail}}.",
|
|
"intent": "Buy me a black phone case (from the \"Basic Cases\" category) with a Pikachu graphic.",
|
|
"instantiation_dict": {
|
|
"product": "black phone case (from the \"Basic Cases\" category)",
|
|
"detail": "a Pikachu graphic"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09Q2B4X8S"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 127,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 377,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} with {{detail}}.",
|
|
"intent": "Buy me a red phone case with an Iron Man graphic.",
|
|
"instantiation_dict": {
|
|
"product": "red phone case",
|
|
"detail": "an Iron Man graphic"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07P9R993T",
|
|
"Red"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 127,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 378,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I am a fan of {{organization}}. Can you find a url of an image of an item in the \"{{product_category}}\" category I can buy to support them?",
|
|
"intent": "I am a fan of the Atlanta Falcons. Can you find a url of an image of an item in the \"Playstation 4\" category I can buy to support them?",
|
|
"instantiation_dict": {
|
|
"organization": "the Atlanta Falcons",
|
|
"product_category": "Playstation 4"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There are no Falcons items available in this category.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 128,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 379,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I am a fan of {{organization}}. Can you find a url of an image of an item in the \"{{product_category}}\" category I can buy to support them?",
|
|
"intent": "I am a fan of the Cleveland Browns. Can you find a url of an image of an item in the \"Playstation 4\" category I can buy to support them?",
|
|
"instantiation_dict": {
|
|
"organization": "the Cleveland Browns",
|
|
"product_category": "Playstation 4"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There are no Browns items available in this category.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 128,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 380,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I am a fan of {{organization}}. Can you find a url of an image of an item in the \"{{product_category}}\" category I can buy to support them?",
|
|
"intent": "I am a fan of the Buffalo Bills. Can you find a url of an image of an item in the \"Playstation 4\" category I can buy to support them?",
|
|
"instantiation_dict": {
|
|
"organization": "the Buffalo Bills",
|
|
"product_category": "Playstation 4"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There are no Bills items available in this category.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 128,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 381,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "I am a fan of {{organization}}. Can you find a url of an image of an item in the \"{{product_category}}\" category I can buy to support them?",
|
|
"intent": "I am a fan of the Miami Dolphins. Can you find a url of an image of an item in the \"Playstation 4\" category I can buy to support them?",
|
|
"instantiation_dict": {
|
|
"organization": "the Miami Dolphins",
|
|
"product_category": "Playstation 4"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"must_include": [
|
|
"B07583CVJW.0.jpg |OR| B07583CVJW.1.jpg"
|
|
]
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "",
|
|
"reference_answer_raw_annotation": "__SHOPPING__/media/catalog/product/cache/89ff578b9cd87e0600daac45c9e1ea98/B/0/B07583CVJW.0.jpg"
|
|
},
|
|
"intent_template_id": 128,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 382,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/xbox-one.html?p=9",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} on the page {{detail}}.",
|
|
"intent": "Buy the controller (in any color) on the page with a black gradient.",
|
|
"instantiation_dict": {
|
|
"product": "controller (in any color)",
|
|
"detail": "with a black gradient"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B075JFXXTM"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 129,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 383,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/xbox-one.html?p=13",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} on the page {{detail}}.",
|
|
"intent": "Buy the item on the page with Rick and Morty themes.",
|
|
"instantiation_dict": {
|
|
"product": "item",
|
|
"detail": "with Rick and Morty themes"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B081ZNFZZJ"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 129,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 384,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} with {{detail}}.",
|
|
"intent": "Buy the item with a scared Mario Bros character in the \"Nintendo Switch\" category.",
|
|
"instantiation_dict": {
|
|
"product": "item",
|
|
"detail": "a scared Mario Bros character in the \"Nintendo Switch\" category"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07SK4W1VJ"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 122,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 385,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you buy the {{item}} in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"item": "cheapest beer that comes in a box",
|
|
"product_category": "Alcoholic Beverages"
|
|
},
|
|
"intent": "Can you buy the cheapest beer that comes in a box in the \"Alcoholic Beverages\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B00PLXE90I"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 130,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 386,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you buy the {{item}} in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"item": "incorrectly labeled Bud Light",
|
|
"product_category": "Alcoholic Beverages"
|
|
},
|
|
"intent": "Can you buy the incorrectly labeled Bud Light in the \"Alcoholic Beverages\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B00U56P3AQ"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 130,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 387,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you buy the {{item}} in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"item": "cheapest box wine",
|
|
"product_category": "Alcoholic Beverages"
|
|
},
|
|
"intent": "Can you buy the cheapest box wine in the \"Alcoholic Beverages\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B01NBFKHYA"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 130,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 388,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/shave-hair-removal/men-s.html",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} on the page {{detail}}.",
|
|
"instantiation_dict": {
|
|
"product": "pink trimmer for women",
|
|
"detail": ""
|
|
},
|
|
"intent": "Buy the pink trimmer for women on the page.",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B08WKDNLXV"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 129,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"comments": "",
|
|
"overall_difficulty": "easy"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 389,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you buy the {{item}} in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"item": "most expensive item (in any size) that uses a mannequin in its display",
|
|
"product_category": "Virtual Reality (VR) Headsets"
|
|
},
|
|
"intent": "Can you buy the most expensive item (in any size) that uses a mannequin in its display in the \"Virtual Reality (VR) Headsets\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09NBRVLHN"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 130,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 390,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Rate {{product}} in the {{category}} category with {{num_star}} stars, using my nickname {{nickname}}?",
|
|
"instantiation_dict": {
|
|
"product": "the controller with a happy couple on it",
|
|
"category": "\"Legacy Systems > Xbox Systems\"",
|
|
"num_star": 5,
|
|
"nickname": "EmLo"
|
|
},
|
|
"intent": "Rate the controller with a happy couple on it in the \"Legacy Systems > Xbox Systems\" category with 5 stars, using my nickname EmLo?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_sku_latest_review_rating('B09P819K5N')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"100"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_sku_latest_review_author('B09P819K5N')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"EmLo"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 131,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 391,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Rate {{product}} in the {{category}} category with {{num_star}} stars, using my nickname {{nickname}}?",
|
|
"instantiation_dict": {
|
|
"product": "the controller with a sideways display image that is not a stock photo",
|
|
"category": "\"Legacy Systems > Xbox Systems\"",
|
|
"num_star": 0,
|
|
"nickname": "EmLo"
|
|
},
|
|
"intent": "Rate the controller with a sideways display image that is not a stock photo in the \"Legacy Systems > Xbox Systems\" category with 0 stars, using my nickname EmLo?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_sku_latest_review_rating('B00BH4V6HE')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"0"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_sku_latest_review_author('B00BH4V6HE')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"EmLo"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 131,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 392,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you buy the {{item}} in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"item": "purple and blue controllers with lightning and galaxy designs",
|
|
"product_category": "Legacy Systems > Playstation Systems"
|
|
},
|
|
"intent": "Can you buy the purple and blue controllers with lightning and galaxy designs in the \"Legacy Systems > Playstation Systems\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07C85HK2J",
|
|
"Blue+ Purple"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 130,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 393,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/legacy-systems/playstation-systems.html?p=12",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} on the page {{detail}}.",
|
|
"intent": "Buy the item on the page with Toys R Us on the packaging.",
|
|
"instantiation_dict": {
|
|
"product": "item",
|
|
"detail": "with Toys R Us on the packaging"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B004DWOSTU"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 129,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 394,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/legacy-systems/playstation-systems.html?p=14",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} on the page {{detail}}.",
|
|
"intent": "Buy the PSP on the page which has a case in its display image.",
|
|
"instantiation_dict": {
|
|
"product": "PSP",
|
|
"detail": "which has a case in its display image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B000YQL3G0"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 129,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 395,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/legacy-systems/nintendo-systems.html?p=1",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} on the page {{detail}}.",
|
|
"intent": "Buy the Animal Crossing product on the page with a character showing its teeth.",
|
|
"instantiation_dict": {
|
|
"product": "Animal Crossing product",
|
|
"detail": "with a character showing its teeth"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B01D92FIRK"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 129,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 396,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/legacy-systems/nintendo-systems.html?p=4",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} on the page {{detail}}.",
|
|
"intent": "Buy the item on the page with a pink background on the display image (in any edition).",
|
|
"instantiation_dict": {
|
|
"product": "item",
|
|
"detail": "with a pink background on the display image (in any edition)"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B001IAP45W"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 129,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 397,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/nintendo-switch.html?p=2",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} on the page {{detail}}.",
|
|
"intent": "Buy the item on the page with a banana theme.",
|
|
"instantiation_dict": {
|
|
"product": "item",
|
|
"detail": "with a banana theme"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B0931NN4PR"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Fortnite Fleece Bundle"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 129,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 398,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/nintendo-switch.html?p=3",
|
|
"geolocation": null,
|
|
"intent_template": "Given the image, buy the {{product}} which contain the same object in the image on its design.",
|
|
"intent": "Given the image, buy the item on this page (in any style) which contain the same object in the image on its design.",
|
|
"instantiation_dict": {
|
|
"product": "item on this page (in any style)"
|
|
},
|
|
"image": "https://images.pexels.com/photos/207142/pexels-photo-207142.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=2",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B0786JC6VW"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 123,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 399,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/",
|
|
"geolocation": null,
|
|
"intent_template": "Can you buy the {{item}} in the \"{{product_category}}\" category?",
|
|
"instantiation_dict": {
|
|
"item": "cheapest cereal with a graphic character on the box",
|
|
"product_category": "Cereals"
|
|
},
|
|
"intent": "Can you buy the cheapest cereal with a graphic character on the box in the \"Cereals\" category?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07QFH3BGS"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 130,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "medium"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 400,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/video-games/legacy-systems/nintendo-systems.html?p=4",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} with {{detail}}.",
|
|
"intent": "Buy the Nunchuk controller (in any color) on the page with a shadow outline on the display image.",
|
|
"instantiation_dict": {
|
|
"product": "Nunchuk controller (in any color) on the page",
|
|
"detail": "a shadow outline on the display image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B0094X2066"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 122,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 401,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breads-bakery/cakes.html?p=2",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} on the page {{detail}}.",
|
|
"intent": "Buy the cake on the page with a green turtle.",
|
|
"instantiation_dict": {
|
|
"product": "cake",
|
|
"detail": "with a green turtle"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There are no cakes with green turtles available on this page.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 129,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 402,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breads-bakery/cakes.html?p=2",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} on the page {{detail}}.",
|
|
"intent": "Buy the cakes on the page with Korean packaging.",
|
|
"instantiation_dict": {
|
|
"product": "cakes",
|
|
"detail": "with Korean packaging"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"string_match"
|
|
],
|
|
"reference_answers": {
|
|
"fuzzy_match": "N/A"
|
|
},
|
|
"reference_url": "",
|
|
"program_html": [],
|
|
"string_note": "There are no Korean cakes on this page.",
|
|
"reference_answer_raw_annotation": "N/A"
|
|
},
|
|
"intent_template_id": 129,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 403,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breads-bakery/cakes.html?p=4",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} on the page {{detail}}.",
|
|
"intent": "Buy the cake on the page with a kitchen countertop in the display image.",
|
|
"instantiation_dict": {
|
|
"product": "cake",
|
|
"detail": "with a kitchen countertop in the display image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07TGKXHFY"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 129,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 404,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/snacks-sweets/snack-foods.html?p=33&product_list_order=price",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} on the page {{detail}}.",
|
|
"intent": "Buy the snacks on the page with a basketball player on the packaging.",
|
|
"instantiation_dict": {
|
|
"product": "snacks",
|
|
"detail": "with a basketball player on the packaging"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B08M1YSJ7F"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 129,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 405,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} that {{relation}} in the image{{detail}}.",
|
|
"intent": "Buy me a product that has the same function as the items in the image from the \"Cereals\" category.",
|
|
"image": "https://images.pexels.com/photos/187498/pexels-photo-187498.jpeg?auto=compress&cs=tinysrgb&w=800",
|
|
"instantiation_dict": {
|
|
"product": "product",
|
|
"relation": "has the same function as the items",
|
|
"detail": " from the \"Cereals\" category"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B09JV2P5FH"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 125,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 406,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} with {{detail}}.",
|
|
"intent": "Buy the cereal with a beach volleyball player on the packaging.",
|
|
"instantiation_dict": {
|
|
"product": "cereal",
|
|
"detail": "a beach volleyball player on the packaging"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07J4ZTLWG"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 122,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 407,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sports-outdoors/fan-shop.html",
|
|
"geolocation": null,
|
|
"intent_template": "Buy the {{product}} with {{detail}}.",
|
|
"intent": "Buy the top on the page with Boston Celtics colors.",
|
|
"instantiation_dict": {
|
|
"product": "top on the page",
|
|
"detail": "Boston Celtics colors"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07B313S75"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 122,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 408,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} that has a skyline of the city shown in this image.",
|
|
"intent": "Buy me a pair of large shorts that has a skyline of the city shown in this image.",
|
|
"image": "https://images.pexels.com/photos/3964406/pexels-photo-3964406.jpeg?auto=compress&cs=tinysrgb&w=800",
|
|
"instantiation_dict": {
|
|
"product": "pair of large shorts"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07MV1JFND",
|
|
"Large"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 132,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 409,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} that has a skyline of the city shown in this image.",
|
|
"intent": "Buy me a large hoodie that has a skyline of the city shown in this image.",
|
|
"image": "https://images.pexels.com/photos/419235/pexels-photo-419235.jpeg?auto=compress&cs=tinysrgb&w=800",
|
|
"instantiation_dict": {
|
|
"product": "large hoodie"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07XT2SC56",
|
|
"Large"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 132,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 410,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} that references a sports team from this city.",
|
|
"intent": "Buy me a video game controller that references a sports team from this city.",
|
|
"image": "https://images.pexels.com/photos/2539395/pexels-photo-2539395.jpeg?auto=compress&cs=tinysrgb&w=800",
|
|
"instantiation_dict": {
|
|
"product": "video game controller"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B01N57KNX7"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 133,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 411,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} that references the city in the image.",
|
|
"intent": "Buy me a size small shirt under 20 dollars that references the city in the image.",
|
|
"image": "https://images.pexels.com/photos/1239162/pexels-photo-1239162.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=2",
|
|
"instantiation_dict": {
|
|
"product": "size small shirt under 20 dollars"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07R75ZV6F"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "func:get_query_text(__page__, \"#shopping-cart-table\")",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Small"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 134,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 412,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} that references a sports team from this city.",
|
|
"intent": "Buy me a pair of shorts over 50 dollars (in any size) that references a sports team from this city.",
|
|
"image": "https://images.pexels.com/photos/1239162/pexels-photo-1239162.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=2",
|
|
"instantiation_dict": {
|
|
"product": "pair of shorts over 50 dollars (in any size)"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07MV1MZWF"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 133,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 413,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy me a {{product}} that references the city in the image.",
|
|
"intent": "Buy me a pair of small shorts under 30 dollars that references the city in the image.",
|
|
"image": "https://images.pexels.com/photos/1239162/pexels-photo-1239162.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=2",
|
|
"instantiation_dict": {
|
|
"product": "pair of small shorts under 30 dollars"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07PT4DPK2",
|
|
"Small"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 134,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 414,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/oral-care/toothbrushes-accessories.html?p=4",
|
|
"geolocation": null,
|
|
"intent_template": "Rate {{product}} in the {{category}} category with {{num_star}} stars, using my nickname {{nickname}}?",
|
|
"instantiation_dict": {
|
|
"product": "the toothbrush on this page with a cupcake on it",
|
|
"category": "Toothbrushes & Accessories",
|
|
"num_star": 5,
|
|
"nickname": "EmLo"
|
|
},
|
|
"intent": "Rate the toothbrush on this page with a cupcake on it in the Toothbrushes & Accessories category with 5 stars, using my nickname EmLo?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_sku_latest_review_rating('B09P55GY2P')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"100"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_sku_latest_review_author('B09P55GY2P')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"EmLo"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 131,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 415,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/oral-care/toothbrushes-accessories.html?p=5",
|
|
"geolocation": null,
|
|
"intent_template": "Rate {{product}} in the {{category}} category with {{num_star}} stars, using my nickname {{nickname}}?",
|
|
"instantiation_dict": {
|
|
"product": "the toothbrush on this page with a winking character on it",
|
|
"category": "Toothbrushes & Accessories",
|
|
"num_star": 5,
|
|
"nickname": "EmLo"
|
|
},
|
|
"intent": "Rate the toothbrush on this page with a winking character on it in the Toothbrushes & Accessories category with 5 stars, using my nickname EmLo?",
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_sku_latest_review_rating('B09S3PK7R3')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"100"
|
|
]
|
|
}
|
|
},
|
|
{
|
|
"url": "last",
|
|
"locator": "func:shopping_get_sku_latest_review_author('B09S3PK7R3')",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"EmLo"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 131,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"comments": "",
|
|
"overall_difficulty": "hard"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 416,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/beauty-personal-care/personal-care/deodorants-antiperspirants.html",
|
|
"geolocation": null,
|
|
"intent_template": "Buy {{product}} with {{detail}} on the packaging.",
|
|
"intent": "Buy deodorant on the page with the phrase 'extra extra dry' on the packaging.",
|
|
"instantiation_dict": {
|
|
"product": "deodorant on the page",
|
|
"detail": "the phrase 'extra extra dry'"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B01IADXR9E"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 120,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 417,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy {{product}} with {{detail}} on the packaging.",
|
|
"intent": "Buy the cheapest deodorant from the \"Deodorants & Antiperspirants\" category with the phrase 'killer' on the packaging.",
|
|
"instantiation_dict": {
|
|
"product": "the cheapest deodorant from the \"Deodorants & Antiperspirants\" category",
|
|
"detail": "the phrase 'killer'"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B073VBXY7L"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 120,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 418,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy {{product}} with {{detail}} on the packaging.",
|
|
"intent": "Buy the cheapest item from the \"Fragrance > Men's\" category with plastic on the packaging.",
|
|
"instantiation_dict": {
|
|
"product": "the cheapest item from the \"Fragrance > Men's\" category",
|
|
"detail": "plastic"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B07BFHHG97"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 120,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 419,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy {{product}} with {{detail}} on the packaging.",
|
|
"intent": "Buy the most expensive men's fragrance with an animal on the packaging.",
|
|
"instantiation_dict": {
|
|
"product": "the most expensive men's fragrance",
|
|
"detail": "an animal"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B01M6BJEOJ"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 120,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 420,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Buy {{product}} with {{detail}} on the packaging.",
|
|
"intent": "Buy the most expensive wine making kit with a happy couple on the packaging.",
|
|
"instantiation_dict": {
|
|
"product": "the most expensive wine making kit",
|
|
"detail": "a happy couple"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "func:shopping_get_latest_order_url()",
|
|
"locator": "document.querySelector(\".order-details-items.ordered\").outerText",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B085SPWHJS"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 120,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 421,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Help me to add the cheapest {{color}} {{item}} to my wishlist",
|
|
"intent": "Help me to add the cheapest purple phone stand above $8 to my wishlist",
|
|
"instantiation_dict": {
|
|
"color": "purple",
|
|
"item": "phone stand above $8"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Lazy Cell Phone Holder - Universal Phone Holder to Wear Around Neck Lazy Bracket Free Rotating Smart Mobile Phone Mount Stand",
|
|
"Purple"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 135,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 422,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Help me to add the cheapest {{color}} {{item}} to my wishlist",
|
|
"intent": "Help me to add the cheapest fully white women's shoes (any size) to my wishlist",
|
|
"instantiation_dict": {
|
|
"color": "fully white",
|
|
"item": "women's shoes (any size)"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Cute Sandals for Women Beach Comfort Sandals Casual Daily Slip On Platform Sandals Flat Beach Shoes Dressy Slides",
|
|
"A1-white"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 135,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 423,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Help me to add the cheapest {{color}} {{item}} to my wishlist",
|
|
"intent": "Help me to add the cheapest white humidifier to my wishlist",
|
|
"instantiation_dict": {
|
|
"color": "white",
|
|
"item": "humidifier"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"4L Humidifiers for Bedroom - Top Fill Air Humidifier for Large Room, Auto Shut-off Cool Mist Humidifier, Essential-Oil Diffuser, LED Display, Constant Humidity, Mist Mode for Home, Office, Plants"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 135,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 424,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Please add the cheapest {{description}} {{item}} to my shopping cart",
|
|
"intent": "Please add the cheapest anime poster (from the \"Posters & Print\" category) to my shopping cart",
|
|
"instantiation_dict": {
|
|
"description": "anime",
|
|
"item": "poster (from the \"Posters & Print\" category)"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"HWEMAKES Demon Slayer Poster Decorative Painting Canvas Wall Art Living Room Posters Bedroom Painting 16x24inch(40x60cm)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 136,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 425,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Please add the cheapest {{description}} {{item}} to my shopping cart",
|
|
"intent": "Please add the cheapest round smartwatch (from the \"Smartwatches\" category) to my shopping cart",
|
|
"instantiation_dict": {
|
|
"description": "round",
|
|
"item": "smartwatch (from the \"Smartwatches\" category)"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"IDEALROYAL Smart Watch,Fitness Tracker with Heart Rate Monitor,IP68 Waterproof, Blood Pressure,Sleep Monitor, Full Touch Screen Smart Watch for Women Men for Android & iOS (Pink)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 136,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 426,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Please add the cheapest {{description}} {{item}} to my shopping cart",
|
|
"intent": "Please add the cheapest standing projection screen to my shopping cart",
|
|
"instantiation_dict": {
|
|
"description": "standing",
|
|
"item": "projection screen"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"EPSELPSC80 - Duet Ultra Portable Projection Screen"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 136,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 427,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food.html?p=7",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add all the {{items}} {{condition}} to my shopping cart?",
|
|
"intent": "Can you add all the items on this page with korean words to my shopping cart?",
|
|
"instantiation_dict": {
|
|
"items": "items on this page",
|
|
"condition": "with korean words"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Tofu Broth Seasoning (Seafood)",
|
|
"NH WELLHEIM Variety Seoul Tteokbokki Hot& Spicy, Spicy Carbo, and Jjajang Flavors \"Spicy Challenge Box\" (3 COMBO, PACK OF 6)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 72,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 428,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/catalogsearch/result/index/?p=8&q=chair",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add all the {{items}} {{condition}} to my shopping cart?",
|
|
"intent": "Can you add all the items on this page with wheels to my shopping cart?",
|
|
"instantiation_dict": {
|
|
"items": "items on this page",
|
|
"condition": "with wheels"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Modern Upholstered Tufted Velvet Office Chair Adjustable Vanity Chair Makeup Chair Cute Desk Chair Mid Back Computer Chair Accent Chairs for Bedroom, Blue"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 72,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 429,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/electronics/computers-accessories/computers-tablets.html?p=5",
|
|
"geolocation": null,
|
|
"intent_template": "Can you add all the {{items}} {{condition}} to my shopping cart?",
|
|
"intent": "Can you add all the items on this page with a stylus to my shopping cart?",
|
|
"instantiation_dict": {
|
|
"items": "items on this page",
|
|
"condition": "with a stylus"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Navitech 7\" Purple Case/Cover with 360 Rotational Stand & Stylus Pen Compatible with The Hisense Sero Pro 8 / Haier Pad Mini 7.5",
|
|
"Toshiba Dynabook Tecra A30-G 13.3\" FHD Business Laptop Computer, Celeron 5205U Processor @ 1.9GHz, 8GB DDR4 RAM, 256GB PCIe SSD, WiFi 6, Bluetooth, Type-C, Windows 10 Pro Education, 64GB Flash Drive"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 72,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 430,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Help me find all items between {{lower}} and {{upper}} that look like the image below and put them in my cart.",
|
|
"intent": "Help me find all items between $40 and $50 that look like the image below and put them in my cart.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B01GBZZA48.0.jpg",
|
|
"instantiation_dict": {
|
|
"lower": "$40",
|
|
"upper": "$50"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"125ft Weather Seal Quad Shield Outdoor 3GHZ RG-6 Coaxial Cable 75 Ohm (Satellite TV or Broadband Internet) Anti Corrosion Brass Connector RG6 Fittings Assembled in USA by PHAT SATELLITE INTL",
|
|
"GE RG6 Coaxial Cable, 100 ft. F-Type Connectors, Quad Shielded Coax Cable, 3 GHz Digital, In-Wall Rated, Ideal for TV Antenna, DVR, VCR, Satellite, Cable Box, Home Theater, Black, 34842",
|
|
"SiriusXM Satellite Radio 75 Foot RG6 Coaxial Cable Antenna Cable Extension Kit Works with All Sirius, XM and SiriusXM Radio Receivers and Boomboxes",
|
|
"Ucland RP-SMA Male to SMA Male Adapter Connector RG174 Coaxial Cable for Satellite Television Black 2m",
|
|
"55ft TRI-Shield 14AWG 75 Ohm Gel Coated Braid Direct Burial Underground RG-11 Coax HD Cable TV Antenna Weather Seal All Brass CONNECTORS UL ETL Cut to Order Assembled in USA",
|
|
"65ft Made in USA Plenum RG-11 Coax 3Ghz HD Cable TV Antenna 14AWG 75 Ohm All Brass CONNECTORS CMP UL ETL Anti-Static Commercial FIRE Retardant Cut to Order Assembled in USA by PHAT SATELLITE INTL",
|
|
"90ft TRI-Shield 14AWG 75 Ohm Gel Coated Braid Direct Burial Underground RG-11 Coax HD Cable TV Antenna Weather Seal All Brass CONNECTORS UL ETL Cut to Order Assembled in USA",
|
|
"75 Ft Pro Brand RG6 Coax Cable Black Solid Copper Center Conductor Digital 2.25 GHz Satellite HDTV Dish 75 Ohm Shielded Braided Satellite Dish Off-Air HDTV Aerial Antenna Video Jumper Signal",
|
|
"GE RG6 Coaxial Cable, 100 ft. F-Type Connectors, Quad Shielded Coax Cable, 3 GHz Digital, In-Wall Rated, Ideal for TV Antenna, DVR, VCR, Satellite, Cable Box, Home Theater, Black, 34842",
|
|
"Ucland RP-SMA Male to SMA Male Adapter Connector RG174 Coaxial Cable for Satellite Television Black 2m"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 137,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 431,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Help me find all items between {{lower}} and {{upper}} that look like the image below and put them in my cart.",
|
|
"intent": "Help me find all items between $10 and $20 that look like the image below and put them in my cart.",
|
|
"image": "https://images.pexels.com/photos/239578/pexels-photo-239578.jpeg",
|
|
"instantiation_dict": {
|
|
"lower": "$10",
|
|
"upper": "$20"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"6 Pack Assorted Macarons | Gluten Free | Almond Overload, Blueberry Cheesecake & Chocolate Raspberry",
|
|
"12 Pack | Cheesecake Combo French Macarons Value Pack"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 137,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 432,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Help me find all items between {{lower}} and {{upper}} that look like the image below and put them in my cart.",
|
|
"intent": "Help me find all items between $30 and $40 that look like the image below and put them in my cart.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07Q9QGBGV.0.jpg",
|
|
"instantiation_dict": {
|
|
"lower": "$30",
|
|
"upper": "$40"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Magic Array Wireless Charger, 10w Ultra-Thin Qi Fast Wireless Charging Pad, Compatible with iPhone X/XS/MAX/8/8 Plus/Galaxy Note 9/S9/S10/S9 Plus/Note 8/S8 Edge More (Adapter NOT Included) (Pink)",
|
|
"Magic Array Wireless Charger, 10w Ultra-Thin Qi Fast Wireless Charging Pad, Compatible with iPhone X/XS/MAX/8/8 Plus/Galaxy Note 9/S9/S10/S9 Plus/Note 8/S8 Edge More (Adapter NOT Included) (Brown)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 137,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 433,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me the cheapest {{property}} version of the thing in this image and add it to my cart please.",
|
|
"intent": "Find me the cheapest small-packet version of the thing in this image and add it to my cart please.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B01NBY6BCJ.0.jpg",
|
|
"instantiation_dict": {
|
|
"property": "small-packet"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Evaxo Sun-Maid Raisins 24 x 1 oz .#B"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 138,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 434,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me the cheapest {{property}} version of the thing in this image and add it to my cart please.",
|
|
"intent": "Find me the cheapest thick, original version of the thing in this image and add it to my cart please.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B07KKXXM67.0.jpg",
|
|
"instantiation_dict": {
|
|
"property": "thick, original"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"REESE'S Peanut Butter Cups, Milk Chocolate, Snack Size (Pack of 2 Pounds)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 138,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 435,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me the cheapest {{property}} version of the thing in this image and add it to my cart please.",
|
|
"intent": "Find me the cheapest strawberry version of the thing in this image and add it to my cart please.",
|
|
"image": "__SHOPPING__/media/catalog/product/cache/829a59e57f886f8cf0598ffca4f8a940/B/0/B08L3MNSCW.1.jpg",
|
|
"instantiation_dict": {
|
|
"property": "strawberry"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Kit kat chocolate strawberry 12 bars 1 bags Japan import"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 138,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 436,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me the cheapest item that costs {{range}} and can {{function}} like in the image shown and add it to my cart.",
|
|
"intent": "Find me the cheapest item that costs more than $6 and can project onto a screen like in the image shown and add it to my cart.",
|
|
"image": "https://images.pexels.com/photos/2507025/pexels-photo-2507025.jpeg",
|
|
"instantiation_dict": {
|
|
"range": "more than $6",
|
|
"function": "project onto a screen"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Sony VPL-VW1000ES 4K Home Theater ES Projector (2012 Model)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 139,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 437,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me the cheapest item that costs {{range}} and can {{function}} like in the image shown and add it to my cart.",
|
|
"intent": "Find me the cheapest item that costs between $3-4 and can hold up a phone like in the image shown and add it to my cart.",
|
|
"image": "https://images.pexels.com/photos/728842/pexels-photo-728842.jpeg",
|
|
"instantiation_dict": {
|
|
"range": "between $3-4",
|
|
"function": "hold up a phone"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Wireless Bluetooth Selfie Stick and Tripod Combination - Compatible for Samsung S10 Lite & Most Android/iOS Smart Phones"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 139,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 438,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Navigate to the category where this image is most likely to be found. Then, find me the cheapest item that costs {{range}} and can {{function}} like in the image shown and add it to my cart.",
|
|
"intent": "Navigate to the category where this image is most likely to be found. Then, find me the cheapest item that costs more than $5 and can charge multiple devices like in the image shown and add it to my cart.",
|
|
"image": "https://images.pexels.com/photos/8101107/pexels-photo-8101107.jpeg",
|
|
"instantiation_dict": {
|
|
"range": "more than $5",
|
|
"function": "charge multiple devices"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Philips 6-Outlet Extender Surge Protector, 3-Prong, Wall Adapter Plug, Space Saving Design, 1020J, UL Listed, White, SPS1006WA/37 |OR| J.VOLT 4 Outlet Power Strip, 15A 125V 1875W, 90 Joules, 20-Inch Short Cord with Angled Plug, Small Power Strip Surge Protector, ETL Listed"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 140,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "The second item is a power strip (which may be more suitable for the image), but the first can also charge multiple things."
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 439,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Navigate to the category where I can find {{item}} that can help me {{function}}. Add the cheapest one to my cart.",
|
|
"intent": "Navigate to the category where I can find camera that can help me take photos like this. Add the cheapest one to my cart.",
|
|
"image": "https://images.pexels.com/photos/1618606/pexels-photo-1618606.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "camera",
|
|
"function": "take photos like this"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Action Camera Ultra HD 4K Action Camera 10m Waterproof 2.0' Screen 1080p Sport Camera Cam Driving Recorder Tachograph HD (Bundle : Camera Add 64GB Card, Color : Blue)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 141,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 440,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Navigate to the category where I can find {{item}} that can help me {{function}}. Add the cheapest one to my cart.",
|
|
"intent": "Navigate to the category where I can find the ingredient that can help me make the drink in the photo. Add the cheapest one to my cart.",
|
|
"image": "https://images.pexels.com/photos/15125130/pexels-photo-15125130/free-photo-of-coffee-beans-around-coffee-cup.jpeg",
|
|
"instantiation_dict": {
|
|
"item": "the ingredient",
|
|
"function": "make the drink in the photo"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Hills Bros Instant Sugar-Free Double Mocha Cappuccino Mix, Easy to Use, Enjoy Coffeehouse Flavor from Home, Frothy and 8 g of Carbs, 12 Oz"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 141,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 441,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "My kid loves horses, and I want a topper for this. Help me add the least expensive one to my wishlist.",
|
|
"intent": "My kid loves horses, and I want a topper for this. Help me add the least expensive one to my wishlist.",
|
|
"image": "https://images.pexels.com/photos/18955559/pexels-photo-18955559/free-photo-of-a-cupcake-with-strawberry-frosting.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"instantiation_dict": {},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Horse Cupcake Toppers Horse Racing Party Cake Decoration for Horse Theme Birthday Party Supplies SET of 24"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 142,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 442,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Put the least expensive item that has the thing in the first image {{relationship}} the thing in the second image in my wishlist",
|
|
"intent": "Put the least expensive item that has the thing in the first image in the shape of the thing in the second image in my wishlist",
|
|
"image": [
|
|
"https://images.pexels.com/photos/8680077/pexels-photo-8680077.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"https://images.pexels.com/photos/2036544/pexels-photo-2036544.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1"
|
|
],
|
|
"instantiation_dict": {
|
|
"relationship": "in the shape of"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Student Flip Phone for Ferrari Car-Shape Phone Flip Keypad Car Model Mobile Phone GSM Cell Phone 100-240V, Support SMS, MP3, Camera, Video Playback, Recording, Radio, Bluetooth, Calculator(White)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 143,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 443,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Put the least expensive item that has the thing in the first image {{relationship}} the thing in the second image in my wishlist",
|
|
"intent": "Put the least expensive item that has the thing in the first image imprinted on the thing in the second image in my wishlist",
|
|
"image": [
|
|
"https://images.pexels.com/photos/18885866/pexels-photo-18885866/free-photo-of-person-in-deadpool-costume-on-bridge.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"https://images.pexels.com/photos/2323435/pexels-photo-2323435.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1"
|
|
],
|
|
"instantiation_dict": {
|
|
"relationship": "imprinted on"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/wishlist/?limit=50",
|
|
"locator": "document.querySelector('.products-grid.wishlist').textContent",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Vanknight Playstation 4 Dualshock PS4 Controller Skin Vinyl Decals Skins Stickers 2 Pack for PS4 Controller Skins PS4 Skins Deadpool"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 143,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 444,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/health-household/diet-sports-nutrition/nutrition-bars-drinks.html?price=40-50",
|
|
"geolocation": null,
|
|
"intent_template": "Place the item with {{quality}} on this page into my cart",
|
|
"intent": "Place the item with the highest amount of protein per bar on this page into my cart",
|
|
"instantiation_dict": {
|
|
"quality": "the highest amount of protein per bar"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Garden Of Life, Fit Bar Smores Organic, 1.9 Ounce"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 144,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 445,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/grocery-gourmet-food/breads-bakery/cookies.html?price=80-90",
|
|
"geolocation": null,
|
|
"intent_template": "Place the item with {{quality}} on this page into my cart",
|
|
"intent": "Place the item with the darkest packaging on this page into my cart",
|
|
"instantiation_dict": {
|
|
"quality": "the darkest packaging"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"B.A.D. FOOD CO The Peanutter - Peanut Butter Cookies | 5.4oz \u2013 12 Pack | , Grain-Free, Gluten-Free, Refined Sugar Free, No-Soy, Dairy-Free, Non-GMO, Paleo Friendly, and Nutrient Dense!"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 144,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "easy",
|
|
"overall_difficulty": "easy",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 446,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/electronics/television-video/televisions.html?p=4&price=0-100",
|
|
"geolocation": null,
|
|
"intent_template": "Place the item with {{quality}} on this page into my cart",
|
|
"intent": "Place the item with the thickest bezels on this page into my cart",
|
|
"instantiation_dict": {
|
|
"quality": "the thickest bezels"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"SAMSUNG 40 inches LED Smart FDHTV 1080P (Renewed)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 144,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 447,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/cell-phones-accessories/cases-holsters-sleeves.html?price=10-20",
|
|
"geolocation": null,
|
|
"intent_template": "Add all the items with {{quality}} on this page into my cart",
|
|
"intent": "Add all the items with a strap on this page into my cart",
|
|
"instantiation_dict": {
|
|
"quality": "a strap"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"IKASEFU Compatible with iPhone 6 Plus/6S Plus Case Glitter Shiny butterfly Rhinestone Floral Pu Leather Diamond Flash Bling Wallet Strap Case with Card Holder Magnetic Kickstand Flip Cover,Rose gold",
|
|
"Compatible with Samsung Galaxy A51 4G Wallet Case and Tempered Glass Screen Protector Flip Card Holder Cell Accessories Folio Purse Phone Cover for Glaxay A 51 Gaxaly M40S 51A A515F S51 Blue"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 145,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 448,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/office-products/office-furniture-lighting/chairs-sofas.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add all the items with {{quality}} on this page into my cart",
|
|
"intent": "Add all the items with no armrests on this page into my cart",
|
|
"instantiation_dict": {
|
|
"quality": "no armrests"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Rolling Swivel Stool Chairs with Back Wheels Height Adjustable PU Leather Massage Chairs Round Stools with Wheels for Medical Clinic Salon Home Office Hobby Desk Grey",
|
|
"BOWERY HILL Metal 30'' Backless Bar Stool in Black-Antique Gold"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 145,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 449,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/patio-lawn-garden/gardening-lawn-care/plants-seeds-bulbs.html?p=3",
|
|
"geolocation": null,
|
|
"intent_template": "Add all the items with {{quality}} on this page into my cart",
|
|
"intent": "Add all the items with flowers on this page into my cart",
|
|
"instantiation_dict": {
|
|
"quality": "flowers"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Four (4) Orchid Cactus (Epiphyllum) 8\" Fresh Cuttings: 2 for White and 2 for Red Flower",
|
|
"Hirt's White Christmas Cactus Plant - Zygocactus - 6\" Pot",
|
|
"Hawaiian Red Plumeria Plant Cutting Kanoa Hawaii 1 Pack SK34",
|
|
"Knockout Double Pink Rose, 1 Gal"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 145,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 450,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/stackable-clear-shoe-box-front-drop-magnetic-door-dustproof-and-breathable-sneaker-storage-box-shoe-box-organizer-for-women-and-men-fit-up-to-us-size-16.html",
|
|
"geolocation": null,
|
|
"intent_template": "Find me the cheapest {{item}} with the same {{characteristic}} as the majority of the {{items}} shown in the second image on this page and put it in my cart",
|
|
"intent": "Find me the cheapest shoe with the same brand as the majority of the shoes shown in the second image on this page and put it in my cart",
|
|
"instantiation_dict": {
|
|
"item": "shoe",
|
|
"items": "shoes",
|
|
"characteristic": "brand"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Nike SB Mens Charge Canvas Canvas Lifestyle Fashion Sneakers Gray 9.5 Medium (D)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 146,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 451,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me the cheapest {{item}} {{condition}} and add one of any size to my shopping cart.",
|
|
"intent": "Find me the cheapest shoe with a multi-colored word printed on it and add one of any size to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"item": "shoe",
|
|
"condition": "with a multi-colored word printed on it"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"SWEETSHOPZ Hummingbird Geometric Holographic Color White Active Running Walking Sneakers Shoes for Women Men Unisex Kids Adults Fashion Sports"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 147,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 452,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Find me the cheapest {{item}} {{condition}} and add one of any size to my shopping cart.",
|
|
"intent": "Find me the cheapest shoe with marine life printed on it and add one of any size to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"item": "shoe",
|
|
"condition": "with marine life printed on it"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"MAPOLO Animals Words Men's Boys Casual Walking Shoes Sneaker Lightweight Stylish Athletic Tennis Sports Running Shoes for Outdoor Hiking Travel Driving"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 147,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 453,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/sweetshopz-beer-irish-wallpaper-st-patrick-day-active-running-walking-sneakers-shoes-for-women-men-unisex-kids-adults-fashion-sports-black.html |AND| __SHOPPING__/clothing-shoes-jewelry/men/shoes.html?p=4&product_list_order=price",
|
|
"geolocation": null,
|
|
"intent_template": "Find me {{item}}. Add one (in any size) to my cart.",
|
|
"intent": "Find me a product in the Shoes tab that has the closest color to the sneakers in the other tab. Add one (in any size) to my cart.",
|
|
"instantiation_dict": {
|
|
"item": "a product in the Shoes tab that has the closest color to the sneakers in the other tab"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"HUTSENDOX Pillow Slippers Slides for Women Men House Cloud Slipper Shower Slide Sandals Anti-Slip Summer Slippers for Indoor Outdoor",
|
|
"Green"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 148,
|
|
"reasoning_difficulty": "medium",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 454,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/men-s-flip-flop-sandals-comfortable-slip-on-water-shoes-non-slip-flat-thong-sandals.html",
|
|
"geolocation": null,
|
|
"intent_template": "Find me the cheapest {{item}} {{condition}} and add one of any size to my shopping cart.",
|
|
"intent": "Find me the cheapest fruit between $40 and $60 that looks like these shoes and add one of any size to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"item": "fruit",
|
|
"condition": "between $40 and $60 that looks like these shoes"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Small Hass Avocado"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 147,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 455,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/xue-juan-1983-feng-shui-decoration-modern-bubble-girl-sculpture-decoration-home-tv-cabinet-character-statue-decor-ornament-study-office-desktop-bust-character-resin-statue-ornaments-desktop-ornaments.html",
|
|
"geolocation": null,
|
|
"intent_template": "Find {{item}} {{condition}}. Add it to my shopping cart.",
|
|
"intent": "Find a wig between $50 and $100 that best matches this sculpture's hair. Add it to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"item": "a wig",
|
|
"condition": "between $50 and $100 that best matches this sculpture's hair"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Gwen Wig Color 34 Dark Brown with Gray - Foxy Silver Wigs Short Feathered Cut Wispy Bangs Human Hair African American Womens Lightweight Average Cap Bundle w/MaxWigs Hairloss Booklet",
|
|
"Gray"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 149,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 456,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/wapbeng-white-european-and-american-wig-ladies-short-curly-hair-wig-42cm-womens-wigs-lovely-fashion-curly-cosplay-wigs.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add to my cart {{item}} {{condition}}.",
|
|
"intent": "Add to my cart a wig that looks most like this but with longer hair that is between $50 and $100.",
|
|
"instantiation_dict": {
|
|
"item": "a wig that looks most like this",
|
|
"condition": "but with longer hair that is between $50 and $100"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Wavy Hair Wigs - Wigs Synthetic Wigs,for Art Photo Shoot Wig Props and Cosplay Costume Full Wig 100% density (Silver)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 150,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 457,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/nachic-wall-3-piece-wall-art-for-bedroom-black-and-white-teal-rose-canvas-wall-art-still-life-flower-paintings-giclee-print-contemporary-bathroom-wall-decor-framed-ready-to-hang.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add to my cart {{item}} {{condition}}.",
|
|
"intent": "Add to my cart a poster set that looks like this but is pink and not more than $7 more expensive.",
|
|
"instantiation_dict": {
|
|
"item": "a poster set that looks like this",
|
|
"condition": "but is pink and not more than $7 more expensive"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"3 Piece Vintage Canvas Wall Art Pink Peony Flowers Bouquet with White Vase on Books Pictures Romantic Floral Painting Prints Gift Framed for Home Bathroom Bedroom Wall Decor 12\" x 16\" x 3 Panels"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 150,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 458,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/kokopelli-the-ancient-ones-kokopelli-southwest-cotton-woven-blanket-throw-made-in-the-usa-72x54.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add to my cart {{item}} {{condition}}.",
|
|
"intent": "Add to my cart all blankets (including this one) with the same two people holding up the blanket in the photo.",
|
|
"instantiation_dict": {
|
|
"item": "all blankets (including this one)",
|
|
"condition": "with the same two people holding up the blanket in the photo"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Aracnafaria - Anne Stokes Gothic Collection - Cotton Woven Blanket Throw - Made in The USA (72x54)",
|
|
"Heaven's Gate 1 - and God Will Open Wide The Gates of Heaven - Scriptures - 2 Peter 1:11 - Sympathy - Cotton Woven Blanket Throw - Made in The USA (72x54)",
|
|
"Jesus Footprints in The Sand - Sympathy - Cotton Woven Blanket Throw - Made in The USA (72x54)",
|
|
"Kokopelli The Ancient Ones - Kokopelli - Southwest - Cotton Woven Blanket Throw - Made in The USA (72x54)",
|
|
"Russet and Green - Southwest Native American Inspired Tribal Camp - Cotton Woven Blanket Throw - Made in The USA (72x54)",
|
|
"US Marine Corps - Land Sea Air - Cotton Woven Blanket Throw - Made in The USA (72x54)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 150,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "Can be solved by searching for 'Pure Country Weavers blankets'"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 459,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/butterfly-dance-helen-vladykina-cotton-woven-blanket-throw-made-in-the-usa-72x54.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add to my cart {{item}} {{condition}}.",
|
|
"intent": "Add to my cart all blankets (including this one) with the same two people holding up the blanket in the photo.",
|
|
"instantiation_dict": {
|
|
"item": "all blankets (including this one)",
|
|
"condition": "with the same two people holding up the blanket in the photo"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Frida Kahlo - Beautiful and Strong - Cotton Woven Blanket Throw - Made in The USA (72x54)",
|
|
"Hawk - Animal Spirits Totem - Sue Coccia - Cotton Woven Blanket Throw - Made in The USA (72x54)",
|
|
"Sloth Wanna Hang - Victoria Borges - Cotton Woven Blanket Throw - Made in The USA (72x54)",
|
|
"Butterfly Dance - Helen Vladykina - Cotton Woven Blanket Throw - Made in The USA (72x54)"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 150,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": "Can be solved by searching for 'Pure Country Weavers blankets'"
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 460,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/vinyl-skin-sticker-for-playstation-4-pro-blue-fire-ps4-pro-console-and-controllers-skins-vinyl-sticker-decal-cover.html",
|
|
"geolocation": null,
|
|
"intent_template": "I've been thinking about ordering {{item}}, but {{condition}}. Can you add it to my shopping cart if it exists?",
|
|
"intent": "I've been thinking about ordering an Xbox One controller shell, but one that has a matte finish. Can you add it to my shopping cart if it exists?",
|
|
"instantiation_dict": {
|
|
"item": "an Xbox One controller shell",
|
|
"condition": "one that has a matte finish"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"eXtremeRate Blue Flame Faceplate Cover, Soft Touch Front Housing Shell Case, Comfortable Soft Grip Replacement Kit for Microsoft Xbox One X & One S Controller Model 1708 - Controller NOT Included"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 59,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 461,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__",
|
|
"geolocation": null,
|
|
"intent_template": "Add to my cart {{item}} {{condition}}.",
|
|
"intent": "Add to my cart a wig that costs between $50 and $100 and can help me cosplay the character in the image.",
|
|
"image": "https://images.pexels.com/photos/13352513/pexels-photo-13352513.jpeg?auto=compress&cs=tinysrgb&w=1260&h=750&dpr=1",
|
|
"instantiation_dict": {
|
|
"item": "a wig that costs between $50 and $100",
|
|
"condition": "and can help me cosplay the character in the image"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Anime Vocaloid Hatsune Miku Synthetic Wig Costume Game Play Wigs Cosplay miku Long wavy blue Hair Wigs + wig cap One Size PL-823"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 150,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 462,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/noldares-womens-heeled-sandals-fashion-squared-toe-backless-indoor-sandals-mules-stiletto-high-heels-slip-on-heeled-slippers.html",
|
|
"geolocation": null,
|
|
"intent_template": "Find {{item}} {{condition}}. Add it to my shopping cart.",
|
|
"intent": "Find a zebra-striped version of these heels from the same brand with the same pyramid shaped base. Add it to my shopping cart.",
|
|
"instantiation_dict": {
|
|
"item": "a zebra-striped version of these heels from the same brand",
|
|
"condition": "with the same pyramid shaped base"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"NOLDARES Heels for Women Heeled Sandals Slip-On Casual Square Toe Slippers Sandals Fashion Stilettos Heeled Party Single Pumps"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 149,
|
|
"reasoning_difficulty": "hard",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 463,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/motivational-posters-for-classroom-office-decorations-inspirational-quote-wall-art-for-teachers-students-school-counselors-home-office-set-of-10-creative-chalkboard-designs.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add this (in any size) to my cart if {{condition}}",
|
|
"intent": "Add this (in any size) to my cart if at least one of the posters has the word \"inspire\" printed on it",
|
|
"instantiation_dict": {
|
|
"condition": "at least one of the posters has the word \"inspire\" printed on it"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_exclude": [
|
|
"Motivational Posters for Classroom & Office Decorations | Inspirational Quote Wall Art for Teachers, Students, School Counselors, Home & Office | Set of 10 Creative Chalkboard Designs"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 151,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "hard",
|
|
"overall_difficulty": "hard",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 464,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/love-live-quote-art-wall-canvas-painting-dream-art-picture-black-white-print-and-poster-for-living-room-home-decor-70x100cm-3pcs-frameless.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add this (in any size) to my cart if {{condition}}",
|
|
"intent": "Add this (in any size) to my cart if at least one of the posters has the word \"love\" printed on it",
|
|
"instantiation_dict": {
|
|
"condition": "at least one of the posters has the word \"love\" printed on it"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_include": [
|
|
"Love Live Quote Art Wall Canvas Painting Dream Art Picture Black White Print And Poster For Living Room Home Decor (70x100cm\u00d73pcs) Frameless"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 151,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
},
|
|
{
|
|
"sites": [
|
|
"shopping"
|
|
],
|
|
"task_id": 465,
|
|
"require_login": true,
|
|
"storage_state": "./.auth/shopping_state.json",
|
|
"start_url": "__SHOPPING__/ihappywall-3-pieces-bathroom-canvas-wall-art-teal-style-bathtub-bath-set-towel-relax-soothe-unwind-bathroom-still-life-picture-poster-print-on-canvas-stretched-and-framed-ready-to-hang.html",
|
|
"geolocation": null,
|
|
"intent_template": "Add this (in any size) to my cart if {{condition}}",
|
|
"intent": "Add this (in any size) to my cart if at least one of the posters has the word \"happy\" printed on it",
|
|
"instantiation_dict": {
|
|
"condition": "at least one of the posters has the word \"happy\" printed on it"
|
|
},
|
|
"require_reset": false,
|
|
"eval": {
|
|
"eval_types": [
|
|
"program_html"
|
|
],
|
|
"reference_answers": null,
|
|
"reference_url": "",
|
|
"program_html": [
|
|
{
|
|
"url": "__SHOPPING__/checkout/cart",
|
|
"locator": "",
|
|
"required_contents": {
|
|
"must_exclude": [
|
|
"iHAPPYWALL 3 Pieces Bathroom Canvas Wall Art Teal Style Bathtub Bath Set Towel Relax Soothe Unwind Bathroom Still Life Picture Poster Print On Canvas Stretched and Framed Ready To Hang"
|
|
]
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"intent_template_id": 151,
|
|
"reasoning_difficulty": "easy",
|
|
"visual_difficulty": "medium",
|
|
"overall_difficulty": "medium",
|
|
"comments": ""
|
|
}
|
|
] |