fix: apply review suggestions

Pouyanpi · Pouyanpi · commit 482e725d0727 · 2025-04-11T12:01:12.000+02:00
diff --git a/tests/constants.py b/tests/constants.py
diff --git a/tests/test_configs/autoalign/config.yml b/tests/test_configs/autoalign/config.yml
@@ -1,7 +1,7 @@
 models:
   - type: main
-    engine: nemollm
-    model: gpt-43b-002
+    engine: openai
+    model: gpt-3.5-turbo-instruct
 
 rails:
   config:
diff --git a/tests/test_configs/fact_checking/config.yml b/tests/test_configs/fact_checking/config.yml
@@ -1,7 +1,7 @@
 models:
   - type: main
     engine: openai
-    model: gpt-3.5-instruct-turbo
+    model: gpt-3.5-turbo-instruct
 
 rails:
   config:
diff --git a/tests/test_fact_checking.py b/tests/test_fact_checking.py
@@ -21,7 +21,6 @@
 from nemoguardrails import RailsConfig
 from nemoguardrails.actions.actions import ActionResult, action
 from nemoguardrails.llm.providers.trtllm import llm
-from tests.constants import NEMO_API_URL_GPT_43B_002
 from tests.utils import TestChat
 
 CONFIGS_FOLDER = os.path.join(os.path.dirname(__file__), ".", "test_configs")
@@ -113,43 +112,6 @@ async def test_fact_checking_wrong(httpx_mock):
         await chat.bot_async("I don't know the answer to that.")
 
 
-# TODO: fix this!
-@pytest.mark.skip(reason="Not sure why it fails.")
-@pytest.mark.asyncio
-async def test_fact_checking_uncertain(httpx_mock):
-    # Test 4 - Factual statement - AlignScore not very confident in its prediction
-    config = RailsConfig.from_path(os.path.join(CONFIGS_FOLDER, "fact_checking"))
-    chat = TestChat(config)
-    chat.app.register_action(retrieve_relevant_chunks, "retrieve_relevant_chunks")
-
-    httpx_mock.add_response(
-        method="POST",
-        url=NEMO_API_URL_GPT_43B_002,
-        json={"text": "  ask about guardrails"},
-    )
-
-    httpx_mock.add_response(
-        method="POST",
-        url=NEMO_API_URL_GPT_43B_002,
-        json={
-            "text": "NeMo Guardrails is a closed-source proprietary toolkit by Nvidia."
-        },
-    )
-
-    with aioresponses() as m:
-        ## Fact-checking using AlignScore
-        m.post(
-            "http://localhost:5000/alignscore_base",
-            payload={"alignscore": 0.58},
-        )
-
-        chat >> "What is NeMo Guardrails?"
-        await chat.bot_async(
-            "NeMo Guardrails is a closed-source proprietary toolkit by Nvidia.\n"
-            + "Attention: the answer above is potentially inaccurate."
-        )
-
-
 @pytest.mark.asyncio
 async def test_fact_checking_fallback_to_self_check_correct(httpx_mock):
     # Test 4 - Factual statement - AlignScore endpoint not set up properly, use ask llm for fact-checking