Make the Dynamo host and port configurable in the LMCache MMLU tests

ZichengMa · ZichengMa · commit 6f56d79844c8 · 2025-07-16T17:15:36.000-07:00
diff --git a/tests/lmcache/1-mmlu-dynamo.py b/tests/lmcache/1-mmlu-dynamo.py
@@ -2,7 +2,7 @@
 # Reference: https://github.com/LMCache/LMCache/blob/dev/.buildkite/correctness/1-mmlu.py
 
 # ASSUMPTIONS:
-# 1. dynamo is running on port 8080 without LMCache
+# 1. dynamo is running at --host/--port (default: localhost:8080) without LMCache
 # 2. the mmlu dataset is in a "data" directory
 # 3. all invocations of this script should be run in the same directory
 #    (for later consolidation)
@@ -41,7 +41,8 @@ def get_llm_response(args, prompt):
         "stream": False,
         "seed": 42,  # Add explicit seed for determinism
     }
-    res = requests.post("http://localhost:8080/v1/chat/completions", json=data, timeout=30)
+    url = f"http://{args.host}:{args.port}/v1/chat/completions"
+    res = requests.post(url, json=data, timeout=30)
     if res.status_code != 200:
         raise Exception(f"Error: {res.status_code} {res.text}")
     response_json = res.json()
@@ -159,6 +160,8 @@ def main(args):
     parser.add_argument("--model", type=str, required=True)
     parser.add_argument("--result-file", type=str, required=False)
     parser.add_argument("--number-of-subjects", type=int, required=True)
+    parser.add_argument("--host", type=str, default="localhost", help="Dynamo host")
+    parser.add_argument("--port", type=int, default=8080, help="Dynamo port")
 
     args = parser.parse_args()
     if args.result_file is None:
diff --git a/tests/lmcache/2-mmlu-dynamo.py b/tests/lmcache/2-mmlu-dynamo.py
@@ -2,7 +2,7 @@
 # Reference: https://github.com/LMCache/LMCache/blob/dev/.buildkite/correctness/2-mmlu.py
 
 # ASSUMPTIONS:
-# 1. dynamo is running on port 8080 with LMCache enabled
+# 1. dynamo is running at --host/--port (default: localhost:8080) with LMCache enabled
 # 2. the mmlu dataset is in a "data" directory
 # 3. all invocations of this script should be run in the same directory
 #    (for later consolidation)
@@ -41,7 +41,8 @@ def get_llm_response(args, prompt):
         "stream": False,
         "seed": 42,  # Add explicit seed for determinism
     }
-    res = requests.post("http://localhost:8080/v1/chat/completions", json=data, timeout=30)
+    url = f"http://{args.host}:{args.port}/v1/chat/completions"
+    res = requests.post(url, json=data, timeout=30)
     if res.status_code != 200:
         raise Exception(f"Error: {res.status_code} {res.text}")
     response_json = res.json()
@@ -159,6 +160,8 @@ def main(args):
     parser.add_argument("--model", type=str, required=True)
     parser.add_argument("--result-file", type=str, required=False)
     parser.add_argument("--number-of-subjects", type=int, required=True)
+    parser.add_argument("--host", type=str, default="localhost", help="Dynamo host")
+    parser.add_argument("--port", type=int, default=8080, help="Dynamo port")
 
     args = parser.parse_args()
     if args.result_file is None: