Skip to content

Commit d858650

Browse files
Move nlp folder to llm folder (#439)
Signed-off-by: Onur Yilmaz <oyilmaz@nvidia.com>
Signed-off-by: Pablo Garay <pagaray@nvidia.com>
Co-authored-by: Pablo Garay <pagaray@nvidia.com>
1 parent 2b698b6 commit d858650

34 files changed

+190 / -163 lines changed

nemo_deploy/deploy_ray.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -25,8 +25,8 @@
2525
import ray
2626
from ray import serve
2727

28-
from nemo_deploy.nlp.hf_deployable_ray import HFRayDeployable
29-
from nemo_deploy.nlp.megatronllm_deployable_ray import MegatronRayDeployable
28+
from nemo_deploy.llm.hf_deployable_ray import HFRayDeployable
29+
from nemo_deploy.llm.megatronllm_deployable_ray import MegatronRayDeployable
3030
from nemo_export.tensorrt_llm_deployable_ray import TensorRTLLMRayDeployable
3131

3232
HAVE_RAY = True
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@
2121
stacklevel=2,
2222
)
2323

24-
from nemo_deploy.nlp.query_llm import (
24+
from nemo_deploy.llm.query_llm import (
2525
NemoQueryLLM,
2626
NemoQueryLLMHF,
2727
NemoQueryLLMPyTorch,
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@
2222
from fastapi import FastAPI, HTTPException
2323
from ray import serve
2424

25-
from nemo_deploy.nlp.hf_deployable import HuggingFaceLLMDeploy
25+
from nemo_deploy.llm.hf_deployable import HuggingFaceLLMDeploy
2626
from nemo_deploy.ray_utils import find_available_port
2727

2828
LOGGER = logging.getLogger("NeMo")
Lines changed: 28 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,28 @@
1+
# Copyright (c) 2025, NVIDIA CORPORATION. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
15+
from nemo_deploy.llm.inference.inference_base import (
16+
create_mcore_engine,
17+
setup_megatron_model_and_tokenizer_for_inference,
18+
setup_model_and_tokenizer_for_inference,
19+
)
20+
from nemo_deploy.llm.inference.tron_utils import DistributedInitConfig, RNGConfig
21+
22+
__all__ = [
23+
"create_mcore_engine",
24+
"setup_model_and_tokenizer_for_inference",
25+
"setup_megatron_model_and_tokenizer_for_inference",
26+
"DistributedInitConfig",
27+
"RNGConfig",
28+
]
File renamed without changes.
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@
2525
from megatron.core.inference.inference_request import InferenceRequest
2626

2727
from nemo_deploy import ITritonDeployable
28-
from nemo_deploy.nlp.inference.inference_base import create_mcore_engine
28+
from nemo_deploy.llm.inference.inference_base import create_mcore_engine
2929
from nemo_deploy.utils import (
3030
NEMO2,
3131
broadcast_list,
File renamed without changes.

0 commit comments

Comments
 (0)