Skip to content

Commit

Permalink
ci tests
Browse files Browse the repository at this point in the history
  • Loading branch information
gasse committed Nov 1, 2024
1 parent 2404283 commit 3e0a3d2
Showing 1 changed file with 20 additions and 4 deletions.
24 changes: 20 additions & 4 deletions tests/experiments/test_benchmark.py
Original file line number Diff line number Diff line change
Expand Up @@ -91,7 +91,7 @@ def test_benchmark_subset():
assert dict_1 == dict_2


def test_miniwob_benchmark_reset():
def test_prepare_backend_miniwob():
MINIWOB_URL = os.environ["MINIWOB_URL"]
try:
benchmark: Benchmark = DEFAULT_BENCHMARKS["miniwob"]()
Expand All @@ -109,13 +109,13 @@ def test_miniwob_benchmark_reset():
os.environ["MINIWOB_URL"] = MINIWOB_URL


def test_assistantbench_benchmark_reset():
def test_prepare_backend_assistantbench():
    """Build the default "assistantbench" benchmark and prepare its backends.

    The test passes as long as neither the construction nor the
    ``prepare_backends()`` call raises.
    """
    make_benchmark = DEFAULT_BENCHMARKS["assistantbench"]
    assistantbench: Benchmark = make_benchmark()
    assistantbench.prepare_backends()


@pytest.mark.skip
def test_webarena_benchmark_reset():
def test_prepare_backend_webarena():
WA_FULL_RESET = os.environ["WA_FULL_RESET"]
try:
benchmark: Benchmark = DEFAULT_BENCHMARKS["webarena"]()
Expand All @@ -134,7 +134,7 @@ def test_webarena_benchmark_reset():


@pytest.mark.skip
def test_visualwebarena_benchmark_reset():
def test_prepare_backend_visualwebarena():
VWA_FULL_RESET = os.environ["VWA_FULL_RESET"]
try:
benchmark: Benchmark = DEFAULT_BENCHMARKS["visualwebarena"]()
Expand All @@ -152,6 +152,22 @@ def test_visualwebarena_benchmark_reset():
os.environ["VWA_FULL_RESET"] = VWA_FULL_RESET


@pytest.mark.skip
def test_prepare_backend_weblinx():
    """Exercise WebLINX backend preparation with and without its cache-dir variable.

    The test first prepares the backends while ``BROWSERGYM_WEBLINX_CACHE_DIR``
    is set, then removes the variable and checks that preparing the backends
    again raises. The original value is always written back afterwards.
    """
    env_key = "BROWSERGYM_WEBLINX_CACHE_DIR"
    # Read up front: a missing variable fails here, before anything is mutated.
    saved_cache_dir = os.environ[env_key]
    try:
        weblinx: Benchmark = DEFAULT_BENCHMARKS["weblinx"]()

        # With the variable present, preparation must not raise.
        weblinx.prepare_backends()

        # Without the variable, preparation is expected to raise.
        del os.environ[env_key]
        with pytest.raises(Exception):
            weblinx.prepare_backends()

    finally:
        # Restore the environment so other tests are not affected.
        os.environ[env_key] = saved_cache_dir


def test_run_mock_benchmark():
benchmark = Benchmark(
name="miniwob_click_test",
Expand Down

0 comments on commit 3e0a3d2

Please sign in to comment.