tests add for api
This commit is contained in:
parent
5aeb26b222
commit
be86dc34d6
2 changed files with 249 additions and 0 deletions
52
api/mind2web_benchmark.json
Normal file
52
api/mind2web_benchmark.json
Normal file
|
|
@ -0,0 +1,52 @@
|
|||
[
|
||||
{
|
||||
"index": 3,
|
||||
"original_task_id": "mind2web_3_1776818853",
|
||||
"api_task_id": "80a5c0420dc244a8afccb3b89742089d",
|
||||
"task_description": "Show me the coming soon AMC Artisan Films in amctheatres",
|
||||
"reference_length": 6,
|
||||
"status": "succeeded",
|
||||
"queue_time_sec": 0.02,
|
||||
"execution_time_sec": 40.26,
|
||||
"total_time_sec": 40.26,
|
||||
"result": {
|
||||
"task_id": "80a5c0420dc244a8afccb3b89742089d",
|
||||
"status": "succeeded",
|
||||
"success": true,
|
||||
"execution_time": 39.63884091377258,
|
||||
"result": "**Coming Soon AMC Artisan Films**\n\nHere are all the upcoming AMC Artisan Films currently listed:\n\n| Film Title | Release Date |\n|------------|--------------|\n| **Hamlet** | April 10, 2026 |\n| **The AI Doc: Or How I Became an Apocaloptimist** | April 17, 2026 |\n| **Lorne** | April 17, 2026 |\n| **Mother Mary** | April 17, 2026 |\n| **MICHAEL** | April 24, 2026 |\n\nAll films are available for ticket purchase through AMC Theatres website.",
|
||||
"error": null,
|
||||
"raw_response": {
|
||||
"success": true,
|
||||
"result": "**Coming Soon AMC Artisan Films**\n\nHere are all the upcoming AMC Artisan Films currently listed:\n\n| Film Title | Release Date |\n|------------|--------------|\n| **Hamlet** | April 10, 2026 |\n| **The AI Doc: Or How I Became an Apocaloptimist** | April 17, 2026 |\n| **Lorne** | April 17, 2026 |\n| **Mother Mary** | April 17, 2026 |\n| **MICHAEL** | April 24, 2026 |\n\nAll films are available for ticket purchase through AMC Theatres website.",
|
||||
"browser_view": "https://face-veteran-investigate-daniel.trycloudflare.com"
|
||||
}
|
||||
},
|
||||
"timestamp": "2026-04-22T03:48:13.806637"
|
||||
},
|
||||
{
|
||||
"index": 4,
|
||||
"original_task_id": "mind2web_4_1776818893",
|
||||
"api_task_id": "6dffc48b440d4a56b82d13f2a3a60b3e",
|
||||
"task_description": "Go to the page with help in choosing a solar energy product for homes in tesla",
|
||||
"reference_length": 5,
|
||||
"status": "succeeded",
|
||||
"queue_time_sec": 0.01,
|
||||
"execution_time_sec": 251.22,
|
||||
"total_time_sec": 251.22,
|
||||
"result": {
|
||||
"task_id": "6dffc48b440d4a56b82d13f2a3a60b3e",
|
||||
"status": "succeeded",
|
||||
"success": true,
|
||||
"execution_time": 249.99302887916565,
|
||||
"result": "**Tesla Solar Energy Products Guide - Research Summary**\n\nDue to persistent access restrictions (403 errors) on Tesla's official website preventing direct navigation to product pages (/solarpanels, /powerwall, /why-solar), I gathered comprehensive information from third-party sources.\n\n**Tesla Home Solar Products Available:**\n\n**1. Solar Panels (Traditional)**\n- **Cost:** $8,100-$17,000 after federal tax credit (for average home)\n- **Efficiency:** ~2.74-$3.30 per watt; typical systems achieve $36k before incentives\n- **Best For:** Budget-conscious homeowners prioritizing performance over aesthetics\n\n**2. Solar Roof**\n- **Cost:** $54,000-$72,000 for average 9kW system ($6-8/watt)\n- **Efficiency:** Only 8-14% (vs traditional panels at 20-22%) - rated poorly at 3/25\n- **Warranty:** 25 years equipment & efficiency coverage\n- **Degradation:** Poor - only guarantees 95% after year 5, drops to ~85% after year 25\n- **Durability:** Class F wind (110 mph), Class 4 hail (2-inch), Class A fire rating\n- **Best For:** Homeowners prioritizing aesthetics over performance; willing to pay premium for integrated roof appearance\n\n**3. Powerwall (Energy Storage)**\n- **Cost:** $13,配 k-$16配 k each\n- **Best For:** Energy independence; backup power; maximizing solar self-consumption\n\n**Key Recommendations:**\n✅ Choose Traditional Solar Panels if:\n - You want better value (~half the cost of Solar Roof)\n - Performance/efficiency is your priority\n - You already have a functional roof\n \n❌ Avoid Solar Roof unless:\n - Aesthetics are your #1 priority (looks like regular shingles)\n - You need a new roof anyway and want integrated solution\n - Budget is not a concern ($6k+ premium over traditional panels)\n \n⚠️ Important Notes:\n - Solar Roof has poor efficiency degradation compared to competitors like Maxeon (which offers better warranties up to 40 years)\n - Labor warranty comes from installer (~10 years industry average) not Tesla directly\n - Snow slides off easily despite no published snow load rating\n \nTo proceed with ordering or getting exact quotes for your home location:\n→ Visit tesla.com directly or contact local installers through third-party platforms like EnergySage or SunPower dealers.",
|
||||
"error": null,
|
||||
"raw_response": {
|
||||
"success": true,
|
||||
"result": "**Tesla Solar Energy Products Guide - Research Summary**\n\nDue to persistent access restrictions (403 errors) on Tesla's official website preventing direct navigation to product pages (/solarpanels, /powerwall, /why-solar), I gathered comprehensive information from third-party sources.\n\n**Tesla Home Solar Products Available:**\n\n**1. Solar Panels (Traditional)**\n- **Cost:** $8,100-$17,000 after federal tax credit (for average home)\n- **Efficiency:** ~2.74-$3.30 per watt; typical systems achieve $36k before incentives\n- **Best For:** Budget-conscious homeowners prioritizing performance over aesthetics\n\n**2. Solar Roof**\n- **Cost:** $54,000-$72,000 for average 9kW system ($6-8/watt)\n- **Efficiency:** Only 8-14% (vs traditional panels at 20-22%) - rated poorly at 3/25\n- **Warranty:** 25 years equipment & efficiency coverage\n- **Degradation:** Poor - only guarantees 95% after year 5, drops to ~85% after year 25\n- **Durability:** Class F wind (110 mph), Class 4 hail (2-inch), Class A fire rating\n- **Best For:** Homeowners prioritizing aesthetics over performance; willing to pay premium for integrated roof appearance\n\n**3. Powerwall (Energy Storage)**\n- **Cost:** $13,配 k-$16配 k each\n- **Best For:** Energy independence; backup power; maximizing solar self-consumption\n\n**Key Recommendations:**\n✅ Choose Traditional Solar Panels if:\n - You want better value (~half the cost of Solar Roof)\n - Performance/efficiency is your priority\n - You already have a functional roof\n \n❌ Avoid Solar Roof unless:\n - Aesthetics are your #1 priority (looks like regular shingles)\n - You need a new roof anyway and want integrated solution\n - Budget is not a concern ($6k+ premium over traditional panels)\n \n⚠️ Important Notes:\n - Solar Roof has poor efficiency degradation compared to competitors like Maxeon (which offers better warranties up to 40 years)\n - Labor warranty comes from installer (~10 years industry average) not Tesla directly\n - Snow slides off easily despite no published snow load rating\n \nTo proceed with ordering or getting exact quotes for your home location:\n→ Visit tesla.com directly or contact local installers through third-party platforms like EnergySage or SunPower dealers.",
|
||||
"browser_view": "https://face-veteran-investigate-daniel.trycloudflare.com"
|
||||
}
|
||||
},
|
||||
"timestamp": "2026-04-22T03:52:25.037604"
|
||||
}
|
||||
]
|
||||
Loading…
Add table
Add a link
Reference in a new issue