diff --git a/scripts/evaluation_with_nemo_run.py b/scripts/evaluation_with_nemo_run.py index 92ffed4f..e827a94d 100644 --- a/scripts/evaluation_with_nemo_run.py +++ b/scripts/evaluation_with_nemo_run.py @@ -237,6 +237,8 @@ def slurm_executor( if custom_env_vars: env_vars |= custom_env_vars + # Recommended to use this over run.Packager() as it can lead to fiddle serialization errors importing + # 'wait_and_evaluate' method from 'helpers' packager = run.Config(run.GitArchivePackager, subpath="scripts") executor = run.SlurmExecutor( @@ -304,17 +306,18 @@ def main(): deploy_script = TRITON_DEPLOY_SCRIPT.format( **commons_args, additional_args=additional_args ) + deploy_run_script = run.Script(inline=deploy_script) elif args.serving_backend == "ray": if args.num_cpus_per_replica: additional_args += f" --num_cpus_per_replica {args.num_cpus_per_replica}" deploy_script = RAY_DEPLOY_SCRIPT.format( **commons_args, additional_args=additional_args ) + deploy_run_script = run.Script(inline=deploy_script, metadata={"use_with_ray_cluster": True}) else: raise ValueError(f"Invalid serving backend: {args.serving_backend}") - print(deploy_script) - deploy_run_script = run.Script(inline=deploy_script) + print(deploy_script) api_endpoint = run.Config( ApiEndpoint,