We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e748de1, commit 32ada21 (Copy full SHA for 32ada21)
nemo_rl/algorithms/grpo.py
@@ -309,6 +309,11 @@ def setup(
309
)
310
elif backend == "vllm":
311
generation_config = cast(VllmConfig, generation_config)
312
+ if generation_config["vllm_cfg"]["precision"] == "fp8":
313
+ assert loss_config["use_importance_sampling_correction"] is True, (
314
+ "Importance sampling must be enabled for vLLM FP8 generation!"
315
+ )
316
+
317
policy_generation = VllmGeneration(
318
cluster=inference_cluster, config=generation_config
319
0 commit comments