Skip to content

Commit 1baa79b

Browse files
Merge branch 'main' into remove-dataset-formatting-module
2 parents 1bda85f + 68ef15c commit 1baa79b

File tree

3 files changed

+7
-160
lines changed

3 files changed

+7
-160
lines changed

.github/workflows/slow-tests.yml

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -115,6 +115,4 @@ jobs:
115115
source .venv/bin/activate
116116
uv pip install slack_sdk tabulate
117117
python scripts/log_reports.py >> $GITHUB_STEP_SUMMARY
118-
python scripts/log_example_reports.py --text_file_name temp_results_sft_tests.txt >> $GITHUB_STEP_SUMMARY
119-
python scripts/log_example_reports.py --text_file_name temp_results_dpo_tests.txt >> $GITHUB_STEP_SUMMARY
120118
rm *.txt

scripts/log_example_reports.py

Lines changed: 0 additions & 158 deletions
This file was deleted.

tests/test_judges.py

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,7 @@
1212
# See the License for the specific language governing permissions and
1313
# limitations under the License.
1414

15+
import sys
1516
import time
1617

1718
import pytest
@@ -59,6 +60,9 @@ def load_pair_rm_judge(self):
5960
raise ValueError("Failed to load PairRMJudge")
6061

6162
@require_llm_blender
63+
@pytest.mark.skipif(
64+
sys.version_info[:3] == (3, 13, 8), reason="Python 3.13.8 has a bug in inspect.BlockFinder (cpython GH-139783)"
65+
)
6266
def test_pair_rm_judge(self):
6367
judge = self.load_pair_rm_judge()
6468
prompts, completions = self._get_prompts_and_pairwise_completions()
@@ -68,6 +72,9 @@ def test_pair_rm_judge(self):
6872
assert ranks == [0, 1]
6973

7074
@require_llm_blender
75+
@pytest.mark.skipif(
76+
sys.version_info[:3] == (3, 13, 8), reason="Python 3.13.8 has a bug in inspect.BlockFinder (cpython GH-139783)"
77+
)
7178
def test_pair_rm_judge_return_scores(self):
7279
judge = self.load_pair_rm_judge()
7380
prompts, completions = self._get_prompts_and_pairwise_completions()

0 commit comments

Comments
 (0)