diff --git a/.github/workflows/cicd-main-export-deploy.yml b/.github/workflows/cicd-main-export-deploy.yml deleted file mode 100644 index 0e3f9a6d43b7..000000000000 --- a/.github/workflows/cicd-main-export-deploy.yml +++ /dev/null @@ -1,115 +0,0 @@ -# Copyright (c) 2025, NVIDIA CORPORATION. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. -name: NeMo E2E Export Deploy Tests -on: - workflow_call: - inputs: - test_to_run: - required: true - type: string - image-name: - required: false - default: nemo_container_export_deploy - type: string - -jobs: - build: - uses: ./.github/workflows/_build_container.yml - with: - image-name: ${{ inputs.image-name }} - dockerfile: docker/Dockerfile.ci.export_deploy - - unit-tests: - strategy: - fail-fast: false - matrix: - include: - - script: L0_Unit_Tests_GPU_Export_Deploy - runner: self-hosted-azure - is-optional: true - - script: L0_Unit_Tests_CPU_Export_Deploy - runner: self-hosted-azure-cpu - cpu-only: true - - script: L0_Unit_Tests_Eval_Legacy - runner: self-hosted-azure - - script: L0_Unit_Tests_Eval - runner: self-hosted-azure - - script: L0_Unit_Tests_Eval_Adapters - runner: self-hosted-azure - needs: [build] - runs-on: ${{ matrix.runner }} - name: ${{ matrix.is-optional && 'PLEASEFIXME_' || '' }}${{ matrix.script }} - steps: - - name: Checkout - uses: actions/checkout@v4 - with: - path: ${{ github.run_id }} - - name: main - uses: NVIDIA/NeMo/.github/actions/test-template@main - with: - runner: ${{ runner.name }} - script: ${{ 
matrix.script }} - is_unit_test: true - tests_to_run: ${{ inputs.test_to_run }} - image: ${{ inputs.image-name }} - cpu-only: ${{ matrix.cpu-only || false }} - is_optional: ${{ matrix.is-optional || false }} - e2e-tests: - strategy: - fail-fast: false - matrix: - include: - # Export tests - - script: L2_NeMo_2_Export_HF_TRT_LLM - runner: self-hosted-azure - - script: L2_NeMo_2_Export_Deploy_Query_In_Framework - runner: self-hosted-azure - is-optional: true - - script: L2_ONNX_TRT_LLM_Embedding_Export - runner: self-hosted-azure - is-optional: true - - script: L2_NeMo_2_Export_TRT_LLM - runner: self-hosted-azure - - script: L2_NeMo_2_vLLM_Export_Llama - runner: self-hosted-azure - - script: L2_NeMo_2_vLLM_Export_Mixtral - runner: self-hosted-azure - - script: L2_NeMo_2_Export_In_Framework - runner: self-hosted-azure - - script: L2_NeMo_2_Export_Qnemo_TRT_LLM - runner: self-hosted-azure - - script: L2_NeMo_2_VLLM_VISION - runner: self-hosted-azure - - script: L2_NeMo_2_EVAL_Legacy - runner: self-hosted-azure-gpus-1 - - script: L2_NeMo_2_EVAL_gsm8k - runner: self-hosted-azure-gpus-1 - - script: L2_NeMo_2_EVAL_arcc - runner: self-hosted-azure-gpus-1 - needs: [unit-tests] - runs-on: ${{ matrix.runner }} - name: ${{ matrix.is-optional && 'PLEASEFIXME_' || '' }}${{ matrix.script }} - steps: - - name: Checkout - uses: actions/checkout@v4 - with: - path: ${{ github.run_id }} - - name: main - uses: NVIDIA/NeMo/.github/actions/test-template@main - with: - runner: ${{ runner.name }} - script: ${{ matrix.script }} - tests_to_run: ${{ inputs.test_to_run }} - image: ${{ inputs.image-name }} - is_optional: ${{ matrix.is-optional || false }} diff --git a/.github/workflows/cicd-main.yml b/.github/workflows/cicd-main.yml index e2c7d314f3a8..dffbee9694a7 100644 --- a/.github/workflows/cicd-main.yml +++ b/.github/workflows/cicd-main.yml @@ -253,27 +253,6 @@ jobs: with: test_to_run: ${{ needs.pre-flight.outputs.test_to_run }} - cicd-main-export-deploy: - needs: [pre-flight, 
cicd-test-container-build, cicd-main-unit-tests] - uses: ./.github/workflows/cicd-main-export-deploy.yml - if: | - ( - needs.pre-flight.outputs.test_to_run != '[]' - && ( - contains(fromJson(needs.pre-flight.outputs.components_to_run), 'export-deploy') - ) - ) - && ( - success() - || ( - needs.cicd-wait-in-queue.result == 'skipped' - && needs.pre-flight.outputs.is_ci_workload == 'true' - ) - ) - && !cancelled() - with: - test_to_run: ${{ needs.pre-flight.outputs.test_to_run }} - cicd-main-speech: needs: [pre-flight, cicd-test-container-build, cicd-main-unit-tests] uses: ./.github/workflows/cicd-main-speech.yml @@ -346,7 +325,6 @@ jobs: - L0_Setup_Test_Data_And_Models - cicd-main-unit-tests - cicd-main-nemo2 - - cicd-main-export-deploy - cicd-main-automodel - cicd-main-speech if: always() diff --git a/nemo/collections/llm/api.py b/nemo/collections/llm/api.py index d47dc842c13b..96dcd1dca6a8 100644 --- a/nemo/collections/llm/api.py +++ b/nemo/collections/llm/api.py @@ -603,6 +603,12 @@ def deploy( enable_flash_decode: bool = True, legacy_ckpt: bool = False, ): + warnings.warn( + "The 'deploy' function is deprecated and will be removed in NeMo FW 25.09 container release. " + "For evaluation functionality, please use the new Eval repository: https://github.com/NVIDIA-NeMo/Eval", + DeprecationWarning, + stacklevel=2, + ) """ Deploys nemo model on a PyTriton server either "in-framework" or by converting to trtllm depending on the backend. This deploy method is intended to be used for evaluation. @@ -791,6 +797,12 @@ def evaluate( eval_cfg: EvaluationConfig = EvaluationConfig(type="gsm8k"), adapter_cfg: AdapterConfig | None = None, ) -> dict: + warnings.warn( + "The 'evaluate' function is deprecated and will be removed in NeMo FW 25.09 container release. 
" + "For evaluation functionality, please use the new Eval repository: https://github.com/NVIDIA-NeMo/Eval", + DeprecationWarning, + stacklevel=2, + ) """ Evaluates nemo model deployed on PyTriton server using nvidia-lm-eval diff --git a/nemo/deploy/__init__.py b/nemo/deploy/__init__.py index 35503fe54339..2859fd065711 100644 --- a/nemo/deploy/__init__.py +++ b/nemo/deploy/__init__.py @@ -13,6 +13,15 @@ # limitations under the License. -from nemo.deploy.deploy_base import DeployBase -from nemo.deploy.deploy_pytriton import DeployPyTriton -from nemo.deploy.triton_deployable import ITritonDeployable +import warnings + +from nemo.deploy.deploy_base import DeployBase # noqa: F401 +from nemo.deploy.deploy_pytriton import DeployPyTriton # noqa: F401 +from nemo.deploy.triton_deployable import ITritonDeployable # noqa: F401 + +warnings.warn( + "The 'nemo.deploy' is deprecated and will be removed in NeMo FW 25.09 container release. " + "Please use the new Export-Deploy repository instead: https://github.com/NVIDIA-NeMo/Export-Deploy", + DeprecationWarning, + stacklevel=2, +) diff --git a/nemo/export/__init__.py b/nemo/export/__init__.py index 9cbd9d4f3e0a..1a5e5f6afd5c 100644 --- a/nemo/export/__init__.py +++ b/nemo/export/__init__.py @@ -19,3 +19,12 @@ __all__ = ["io"] except (ImportError, ModuleNotFoundError): pass + +import warnings + +warnings.warn( + "The 'nemo.export' is deprecated and will be removed in NeMo FW 25.09 container release. " + "Please use the new Export-Deploy repository instead: https://github.com/NVIDIA-NeMo/Export-Deploy", + DeprecationWarning, + stacklevel=2, +) diff --git a/scripts/llm/evaluation.py b/scripts/llm/evaluation.py index 0f6307b1e663..e8b191b97b94 100644 --- a/scripts/llm/evaluation.py +++ b/scripts/llm/evaluation.py @@ -12,11 +12,22 @@ # See the License for the specific language governing permissions and # limitations under the License. 
+import warnings + +warnings.warn( + "This evaluation script is deprecated and will be removed in NeMo FW 25.09 container release. " + "For evaluation functionality, please use the new Eval repository: https://github.com/NVIDIA-NeMo/Eval", + DeprecationWarning, + stacklevel=1, +) + # NOTE: This script is only an example of using NeMo with NeMo-Run's APIs and is subject to change without notice. # This script is used for evaluation on local and slurm executors using NeMo-Run. # It uses deploy method from nemo/llm/collections/api.py to deploy nemo2.0 ckpt on PyTriton server and uses evaluate # method from nemo/llm/collections/api.py to run evaluation on it. # (https://github.com/NVIDIA/NeMo-Run) to configure and execute the runs. +# DEPRECATED: This script and the underlying deploy/evaluate functions will be removed in NeMo FW 25.09. +# Please use the new Eval repository: https://github.com/NVIDIA-NeMo/Eval import argparse from typing import Optional