Quality_evaluation/stuff/main.py
Aleksandr Dubchak 98d5e90894 mind2web
2026-04-23 00:04:11 +03:00

22 lines
No EOL
491 B
Python
Raw Permalink Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

from loaders import load_mind2web_tasks
from runner import run_many_tasks
# your agent (the one you already have)
from agent import agent
def main(
    task_path: str = "../Mind2Web/test_task/test_task_2.json",
    limit: int = 2,
) -> None:
    """Run the agent on a batch of Mind2Web tasks and print a summary.

    Loads tasks with ``load_mind2web_tasks``, runs them through
    ``run_many_tasks`` together with the imported ``agent``, then prints
    the number of results and how many of them report success.

    Args:
        task_path: Path to the task JSON file, forwarded to the loader
            unchanged. The default is a relative path, so it presumably
            depends on the current working directory -- TODO confirm how
            the loader resolves it.
        limit: Value forwarded to the loader's ``limit`` keyword;
            presumably the maximum number of tasks to load -- confirm
            against ``load_mind2web_tasks``.
    """
    tasks = load_mind2web_tasks(task_path, limit=limit)
    results = run_many_tasks(tasks, agent)

    print("\n=== FINAL RESULTS ===")
    print(f"Total: {len(results)}")
    # Assumes each result exposes a boolean-like ``success`` attribute, so
    # summing the flags counts the successful tasks.
    print(f"Success: {sum(r.success for r in results)}")
# Script entry point: run the evaluation only when this file is executed
# directly, not when it is imported as a module.
if __name__ == "__main__":
    main()