Skip to content

Commit 17a6293

Browse files
authored
Merge branch 'main' into video_nvdec_fix
2 parents fcdb67c + 4bd1d85 commit 17a6293

File tree

3 files changed, with 2 additions and 5 deletions.

nemo_curator/stages/text/io/writer/__init__.py

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -13,11 +13,9 @@
13 | 13 |   # limitations under the License.
14 | 14 |
15 | 15 |   from nemo_curator.stages.text.io.writer.jsonl import JsonlWriter
16 |    | - from nemo_curator.stages.text.io.writer.megatron_tokenizer import MegatronTokenizerWriter
17 | 16 |   from nemo_curator.stages.text.io.writer.parquet import ParquetWriter
18 | 17 |
19 | 18 |   __all__ = [
20 | 19 |       "JsonlWriter",
21 |    | -     "MegatronTokenizerWriter",
22 | 20 |       "ParquetWriter",
23 | 21 |   ]

tests/stages/text/io/writer/test_megatron_tokenizer.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -24,8 +24,7 @@
24 | 24 |   import pytest
25 | 25 |
26 | 26 |   import nemo_curator.stages.text.io.writer.utils as writer_utils
27 |    | - from nemo_curator.stages.text.io.writer import MegatronTokenizerWriter
28 |    | - from nemo_curator.stages.text.io.writer.megatron_tokenizer import _INDEX_HEADER
   | 27 | + from nemo_curator.stages.text.io.writer.megatron_tokenizer import _INDEX_HEADER, MegatronTokenizerWriter
29 | 28 |   from nemo_curator.tasks import DocumentBatch
30 | 29 |
31 | 30 |

tutorials/text/megatron-tokenizer/main.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,7 @@
22 | 22 |   from nemo_curator.core.client import RayClient
23 | 23 |   from nemo_curator.pipeline import Pipeline
24 | 24 |   from nemo_curator.stages.text.io.reader import ParquetReader
25 |    | - from nemo_curator.stages.text.io.writer import MegatronTokenizerWriter
   | 25 | + from nemo_curator.stages.text.io.writer.megatron_tokenizer import MegatronTokenizerWriter
26 | 26 |
27 | 27 |
28 | 28 |   def main(args: argparse.Namespace) -> None:

0 commit comments

Comments
 (0)