nemo_automodel.components.datasets.diffusion.meta_files_dataset#
Module Contents#
Classes#
MetaFilesDataset | PyTorch dataset for WAN2.1 .meta files.
Functions#
Data#
API#
- nemo_automodel.components.datasets.diffusion.meta_files_dataset.logger#
‘getLogger(…)’
- class nemo_automodel.components.datasets.diffusion.meta_files_dataset.MetaFilesDataset(
- meta_folder: str,
- transform_text: Optional[Callable[[torch.Tensor], torch.Tensor]] = None,
- transform_video: Optional[Callable[[torch.Tensor], torch.Tensor]] = None,
- filter_fn: Optional[Callable[[Dict], bool]] = None,
- device: str = 'cpu',
- max_files: Optional[int] = None,
)
Bases: torch.utils.data.Dataset
PyTorch dataset for WAN2.1 .meta files.
Initialization
- _log_dataset_stats() None#
- __len__() int#
- __getitem__(index: int) Dict[str, torch.Tensor]#
- nemo_automodel.components.datasets.diffusion.meta_files_dataset.collate_fn(
- batch: List[Dict[str, torch.Tensor]],
)
- nemo_automodel.components.datasets.diffusion.meta_files_dataset.build_node_parallel_sampler(
- dataset: torch.utils.data.Dataset,
- dp_rank: int,
- dp_world_size: int,
- shuffle: bool = True,
)
- nemo_automodel.components.datasets.diffusion.meta_files_dataset.build_dataloader(
- *,
- meta_folder: str,
- batch_size: int,
- dp_rank: int,
- dp_world_size: int,
- shuffle: bool = True,
- num_workers: int = 2,
- device: str = 'cpu',
- transform_text: Optional[Callable[[torch.Tensor], torch.Tensor]] = None,
- transform_video: Optional[Callable[[torch.Tensor], torch.Tensor]] = None,
- filter_fn: Optional[Callable[[Dict], bool]] = None,
- max_files: Optional[int] = None,
)
- nemo_automodel.components.datasets.diffusion.meta_files_dataset.create_dataloader(
- meta_folder: str,
- batch_size: int,
- num_nodes: int,