Skip to content

Commit 70ec17e

Browse files
authored
Update test_llm_api_pytorch.py
Signed-off-by: Yi Zhang <187001205+yizhang-nv@users.noreply.github.com>
1 parent 879eac7 commit 70ec17e

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

tests/integration/defs/accuracy/test_llm_api_pytorch.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1330,7 +1330,7 @@ class TestDeepSeekR1(LlmapiAccuracyTestHarness):
1330 1330
def test_nvfp4_multi_gpus(self, tp_size, pp_size, ep_size, mtp_nextn, fp8kv,
1331 1331
attention_dp, cuda_graph, overlap_scheduler,
1332 1332
max_batch_size, moe_backend):
1333-
kv_cache_config = KvCacheConfig(free_gpu_memory_fraction=0.80)
1333+
kv_cache_config = KvCacheConfig(free_gpu_memory_fraction=0.70)
1334 1334
pytorch_config = dict(
1335 1335
disable_overlap_scheduler=not overlap_scheduler,
1336 1336
cuda_graph_config=CudaGraphConfig() if cuda_graph else None,

0 commit comments

Comments
 (0)