From aac5eaab8c5304f059ed61bbbf56927240a77099 Mon Sep 17 00:00:00 2001 From: Maxime Gasse Date: Thu, 31 Oct 2024 10:49:56 -0400 Subject: [PATCH] Fix duplicate depends_on in webarena metadata (#228) --- .../benchmark/metadata/webarena.csv | 46 +++++++++---------- 1 file changed, 23 insertions(+), 23 deletions(-) diff --git a/browsergym/experiments/src/browsergym/experiments/benchmark/metadata/webarena.csv b/browsergym/experiments/src/browsergym/experiments/benchmark/metadata/webarena.csv index 1161b756..2c9a55e5 100644 --- a/browsergym/experiments/src/browsergym/experiments/benchmark/metadata/webarena.csv +++ b/browsergym/experiments/src/browsergym/experiments/benchmark/metadata/webarena.csv @@ -551,10 +551,10 @@ webarena.548,False,shopping_admin,program_html,548,train,webarena.547 webarena.549,False,shopping_admin,program_html,549,test,webarena.548 webarena.550,False,shopping_admin,program_html,550,train,webarena.549 webarena.551,False,shopping_admin,program_html,551,test,webarena.550 -webarena.552,False,gitlab reddit,program_html,552,test,webarena.537 webarena.410 -webarena.553,False,gitlab reddit,program_html,553,test,webarena.552 webarena.552 -webarena.554,False,gitlab reddit,program_html,554,test,webarena.553 webarena.553 -webarena.555,False,gitlab reddit,program_html,555,test,webarena.554 webarena.554 +webarena.552,False,gitlab reddit,program_html,552,test,webarena.410 webarena.537 +webarena.553,False,gitlab reddit,program_html,553,test,webarena.552 +webarena.554,False,gitlab reddit,program_html,554,test,webarena.553 +webarena.555,False,gitlab reddit,program_html,555,test,webarena.554 webarena.556,False,gitlab wikipedia,program_html,556,train,webarena.555 webarena.557,False,gitlab wikipedia,program_html,557,test,webarena.556 webarena.558,False,gitlab wikipedia,program_html,558,train,webarena.557 @@ -562,10 +562,10 @@ webarena.559,False,gitlab wikipedia,program_html,559,train,webarena.558 webarena.560,False,gitlab wikipedia,program_html,560,test,webarena.559 webarena.561,False,gitlab wikipedia,program_html,561,test,webarena.560 webarena.562,False,gitlab reddit,program_html,562,train,webarena.561 webarena.555 -webarena.563,False,gitlab reddit,program_html,563,train,webarena.562 webarena.562 -webarena.564,False,gitlab reddit,program_html,564,train,webarena.563 webarena.563 -webarena.565,False,gitlab reddit,program_html,565,test,webarena.564 webarena.564 -webarena.566,False,gitlab reddit,program_html,566,test,webarena.565 webarena.565 +webarena.563,False,gitlab reddit,program_html,563,train,webarena.562 +webarena.564,False,gitlab reddit,program_html,564,train,webarena.563 +webarena.565,False,gitlab reddit,program_html,565,test,webarena.564 +webarena.566,False,gitlab reddit,program_html,566,test,webarena.565 webarena.567,False,gitlab,program_html,567,test,webarena.566 webarena.568,False,gitlab,program_html,568,train,webarena.567 webarena.569,False,gitlab,program_html,569,train,webarena.568 @@ -671,23 +671,23 @@ webarena.668,False,gitlab,url_match program_html,668,test,webarena.667 webarena.669,False,gitlab,url_match program_html,669,test,webarena.668 webarena.670,False,gitlab,url_match program_html,670,train,webarena.669 webarena.671,False,shopping reddit,url_match program_html,671,train,webarena.657 webarena.652 -webarena.672,False,shopping reddit,url_match program_html,672,train,webarena.671 webarena.671 -webarena.673,False,shopping reddit,url_match program_html,673,test,webarena.672 webarena.672 -webarena.674,False,shopping reddit,url_match program_html,674,test,webarena.673 webarena.673 -webarena.675,False,shopping reddit,url_match program_html,675,train,webarena.674 webarena.674 +webarena.672,False,shopping reddit,url_match program_html,672,train,webarena.671 +webarena.673,False,shopping reddit,url_match program_html,673,test,webarena.672 +webarena.674,False,shopping reddit,url_match program_html,674,test,webarena.673 +webarena.675,False,shopping reddit,url_match program_html,675,train,webarena.674 webarena.676,False,shopping_admin,url_match program_html,676,test,webarena.551 webarena.677,False,shopping_admin,url_match program_html,677,test,webarena.676 webarena.678,False,shopping_admin,url_match program_html,678,train,webarena.677 webarena.679,False,shopping_admin,url_match program_html,679,train,webarena.678 webarena.680,False,shopping_admin,url_match program_html,680,train,webarena.679 -webarena.681,False,reddit gitlab,url_match program_html,681,train,webarena.675 webarena.670 -webarena.682,False,reddit gitlab,url_match program_html,682,train,webarena.681 webarena.681 -webarena.683,False,reddit gitlab,url_match program_html,683,test,webarena.682 webarena.682 -webarena.684,False,reddit gitlab,url_match program_html,684,train,webarena.683 webarena.683 -webarena.685,False,reddit gitlab,url_match program_html,685,train,webarena.684 webarena.684 -webarena.686,False,reddit gitlab,url_match program_html,686,train,webarena.685 webarena.685 -webarena.687,False,reddit gitlab,url_match program_html,687,test,webarena.686 webarena.686 -webarena.688,False,reddit gitlab,url_match program_html,688,test,webarena.687 webarena.687 +webarena.681,False,reddit gitlab,url_match program_html,681,train,webarena.670 webarena.675 +webarena.682,False,reddit gitlab,url_match program_html,682,train,webarena.681 +webarena.683,False,reddit gitlab,url_match program_html,683,test,webarena.682 +webarena.684,False,reddit gitlab,url_match program_html,684,train,webarena.683 +webarena.685,False,reddit gitlab,url_match program_html,685,train,webarena.684 +webarena.686,False,reddit gitlab,url_match program_html,686,train,webarena.685 +webarena.687,False,reddit gitlab,url_match program_html,687,test,webarena.686 +webarena.688,False,reddit gitlab,url_match program_html,688,test,webarena.687 webarena.689,False,shopping,url_match program_html,689,test,webarena.675 webarena.690,False,shopping,url_match program_html,690,test,webarena.689 webarena.691,False,shopping,url_match program_html,691,train,webarena.690 @@ -758,8 +758,8 @@ webarena.755,False,gitlab,program_html,755,test,webarena.754 webarena.756,False,gitlab,program_html,756,train,webarena.755 webarena.757,False,map,program_html,757,test,webarena.741 webarena.758,False,map,program_html,758,test,webarena.757 -webarena.759,False,map shopping_admin,program_html,759,test,webarena.758 webarena.713 -webarena.760,False,map shopping_admin,program_html,760,test,webarena.759 webarena.759 +webarena.759,False,map shopping_admin,program_html,759,test,webarena.713 webarena.758 +webarena.760,False,map shopping_admin,program_html,760,test,webarena.759 webarena.761,False,map,program_html,761,train,webarena.760 webarena.762,False,map,program_html,762,train,webarena.761 webarena.763,False,map,program_html,763,test,webarena.762 @@ -790,7 +790,7 @@ webarena.787,False,gitlab,string_match,787,test,webarena.786 webarena.788,False,gitlab,string_match,788,test,webarena.787 webarena.789,False,gitlab,string_match,789,test,webarena.788 webarena.790,False,shopping_admin,string_match,790,test,webarena.782 -webarena.791,False,gitlab reddit,string_match,791,train,webarena.789 webarena.735 +webarena.791,False,gitlab reddit,string_match,791,train,webarena.735 webarena.789 webarena.792,False,shopping,string_match,792,test,webarena.693 webarena.793,False,shopping,string_match,793,train,webarena.792 webarena.794,False,shopping,string_match,794,test,webarena.793