diff --git a/scripts/performance/perf_plugins.py b/scripts/performance/perf_plugins.py index 7bbd090497..b94341161d 100644 --- a/scripts/performance/perf_plugins.py +++ b/scripts/performance/perf_plugins.py @@ -307,6 +307,11 @@ def _set_model_specific_environment_variables( if "NVTE_NORM_BWD_USE_CUDNN" in executor.env_vars: executor.env_vars.pop("NVTE_NORM_BWD_USE_CUDNN") + if model_recipe_name in ["nemotron_3_nano"] and compute_dtype == "nvfp4": + executor.env_vars["NVTE_NVFP4_DISABLE_RHT"] = "1" + executor.env_vars["NVTE_NVFP4_DISABLE_STOCHASTIC_ROUNDING"] = "1" + executor.env_vars["NVTE_NVFP4_DISABLE_2D_QUANTIZATION"] = "1" + def _set_layernorm_sm_margin( self, task: Union["run.Partial", "run.Script"],