Skip to content

Commit

Permalink
Miniwob number of seeds 10 -> 5
Browse files Browse the repository at this point in the history
  • Loading branch information
gasse authored Oct 21, 2024
1 parent 8102b64 commit e1bc6b0
Showing 1 changed file with 4 additions and 4 deletions.
8 changes: 4 additions & 4 deletions tests/experiments/test_benchmark.py
Original file line number Diff line number Diff line change
Expand Up @@ -47,10 +47,10 @@ def make_agent(self):
def test_build_benchmarks():
expected_bench_size = {
"miniwob_all": 125 * 5,
- "miniwob_webgum": 56 * 10,
+ "miniwob_webgum": 56 * 5,
"miniwob_tiny_test": 2 * 2,
- "miniwob_train": 107 * 10,
- "miniwob_test": 18 * 10,
+ "miniwob_train": 107 * 5,
+ "miniwob_test": 18 * 5,
"webarena": 812,
"visualwebarena": 910,
"workarena_l1": 33 * 10,
Expand All @@ -72,7 +72,7 @@ def test_benchmark_subset():
benchmark: Benchmark = BENCHMARKS["miniwob_all"]()

benchmark_subset = benchmark.subset_from_regexp(column="task_name", regexp="click")
- assert len(benchmark_subset.env_args_list) == 31 * 10
+ assert len(benchmark_subset.env_args_list) == 31 * 5
assert benchmark_subset.name == "miniwob_all[task_name=/click/]"

benchmark_subset_1 = benchmark_subset.subset_from_regexp(
Expand Down

0 comments on commit e1bc6b0

Please sign in to comment.