NVIDIA-NeMo
diff --git a/dfm/src/common/models/__init__ .py b/dfm/src/common/tokenizers/__init__ .py
rename from dfm/src/common/models/__init__ .py
rename to dfm/src/common/tokenizers/__init__ .py
diff --git a/dfm/src/common/models/cosmos/__init__.py b/dfm/src/common/tokenizers/cosmos/__init__.py
rename from dfm/src/common/models/cosmos/__init__.py
rename to dfm/src/common/tokenizers/cosmos/__init__.py
diff --git a/dfm/src/common/models/cosmos/cosmos1/__init__.py b/dfm/src/common/tokenizers/cosmos/cosmos1/__init__.py
rename from dfm/src/common/models/cosmos/cosmos1/__init__.py
rename to dfm/src/common/tokenizers/cosmos/cosmos1/__init__.py
diff --git a/dfm/src/common/models/cosmos/cosmos1/causal_video_tokenizer.py b/dfm/src/common/tokenizers/cosmos/cosmos1/causal_video_tokenizer.py
rename from dfm/src/common/models/cosmos/cosmos1/causal_video_tokenizer.py
rename to dfm/src/common/tokenizers/cosmos/cosmos1/causal_video_tokenizer.py
Lines changed: 1 addition & 1 deletion
diff --git a/dfm/src/common/models/cosmos/cosmos1/tokenizer_utils.py b/dfm/src/common/tokenizers/cosmos/cosmos1/video_tokenizer_utils.py
rename from dfm/src/common/models/cosmos/cosmos1/tokenizer_utils.py
rename to dfm/src/common/tokenizers/cosmos/cosmos1/video_tokenizer_utils.py
diff --git a/dfm/src/common/utils/save_video.py b/dfm/src/common/utils/save_video.py
Lines changed: 0 additions & 10 deletions
diff --git a/dfm/src/megatron/data/common/__init__.py b/dfm/src/megatron/data/common/__init__.py
diff --git a/dfm/src/megatron/data/dit/base_energon_datamodule.py b/dfm/src/megatron/data/common/base_energon_datamodule.py
rename from dfm/src/megatron/data/dit/base_energon_datamodule.py
rename to dfm/src/megatron/data/common/base_energon_datamodule.py
Lines changed: 1 addition & 1 deletion
diff --git a/dfm/src/megatron/data/dit/diffusion_energon_datamodule.py b/dfm/src/megatron/data/common/diffusion_energon_datamodule.py
rename from dfm/src/megatron/data/dit/diffusion_energon_datamodule.py
rename to dfm/src/megatron/data/common/diffusion_energon_datamodule.py
Lines changed: 1 addition & 1 deletion
diff --git a/dfm/src/megatron/data/dit/diffusion_sample.py b/dfm/src/megatron/data/common/diffusion_sample.py
rename from dfm/src/megatron/data/dit/diffusion_sample.py
rename to dfm/src/megatron/data/common/diffusion_sample.py
@@ -25,7 +25,7 @@
 from huggingface_hub import hf_hub_download
 from tqdm import tqdm
 
-from dfm.src.common.models.cosmos.cosmos1.tokenizer_utils import (
+from dfm.src.common.tokenizers.cosmos.cosmos1.video_tokenizer_utils import (
     load_jit_model,
     numpy2tensor,
     pad_video_batch,
 
@@ -14,7 +14,6 @@
 
 import imageio
 import numpy as np
-import torch
 
 
 def save_video(
@@ -35,12 +34,3 @@ def save_video(
 
     print("video_save_path", video_save_path)
     imageio.mimsave(video_save_path, grid, "mp4", **kwargs)
-
-
-def print_dict(dict):
-    for key, value in dict.items():
-        if isinstance(value, torch.Tensor):
-            print(key, value.shape)
-        else:
-            print(key, value)
-    print("-" * 40)
@@ -24,7 +24,7 @@
 
 class EnergonMultiModalDataModule:
     """
-    A PyTorch Lightning DataModule for handling multimodal datasets with images and text.
+    A DataModule for handling multimodal datasets with images and text.
 
     This data module is designed to work with multimodal datasets that involve both images and text.
     It provides a seamless interface to load training and validation data, manage batching, and handle
 
@@ -23,7 +23,7 @@
 from megatron.energon import DefaultTaskEncoder, get_train_dataset
 from torch import int_repr
 
-from dfm.src.megatron.data.dit.base_energon_datamodule import EnergonMultiModalDataModule
+from dfm.src.megatron.data.common.base_energon_datamodule import EnergonMultiModalDataModule
 from dfm.src.megatron.data.dit.dit_taskencoder import DiTTaskEncoder