Python Module Index b | c | d | f | i | m | n | p | s | t | u b backends backends.base backends.experimental backends.experimental.ray_actor_pool backends.experimental.ray_actor_pool.adapter backends.experimental.ray_actor_pool.executor backends.experimental.ray_actor_pool.raft_adapter backends.experimental.ray_actor_pool.shuffle_adapter backends.experimental.ray_actor_pool.utils backends.experimental.ray_data backends.experimental.ray_data.adapter backends.experimental.ray_data.executor backends.experimental.ray_data.utils backends.experimental.utils backends.internal backends.internal.raft backends.internal.raft.ray_comms backends.utils backends.xenna backends.xenna.adapter backends.xenna.executor c classifiers classifiers.aegis classifiers.base classifiers.content_type classifiers.domain classifiers.fineweb_edu classifiers.prompt_task_complexity classifiers.quality d datasets datasets.doc_dataset datasets.image_text_pair_dataset datasets.parallel_dataset download download.arxiv download.commoncrawl download.doc_builder download.ja_stopwords download.th_stopwords download.wikipedia download.zh_stopwords f filters filters.bitext_filter filters.classifier_filter filters.code filters.doc_filter filters.heuristic_filter filters.models filters.models.qe_models filters.synthetic i image image.classifiers image.classifiers.aesthetic image.classifiers.base image.classifiers.nsfw image.embedders image.embedders.base image.embedders.timm m modifiers modifiers.async_llm_pii_modifier modifiers.c4 modifiers.doc_modifier modifiers.fasttext modifiers.line_remover modifiers.llm_pii_modifier modifiers.markdown_remover modifiers.newline_normalizer modifiers.pii_modifier modifiers.quotation_remover modifiers.slicer modifiers.unicode_reformatter modifiers.url_remover modules modules.add_id modules.base modules.config modules.dataset_ops modules.exact_dedup modules.filter modules.fuzzy_dedup modules.fuzzy_dedup.bucketstoedges modules.fuzzy_dedup.connectedcomponents modules.fuzzy_dedup.fuzzyduplicates modules.fuzzy_dedup.jaccardsimilarity modules.fuzzy_dedup.lsh modules.fuzzy_dedup.minhash modules.joiner modules.meta modules.modify modules.semantic_dedup modules.semantic_dedup.clusteringmodel modules.semantic_dedup.embeddings modules.semantic_dedup.semanticclusterleveldedup modules.semantic_dedup.semdedup modules.splitter modules.task modules.to_backend n nemo_run nemo_run.slurm p pii pii.algorithm pii.constants pii.custom_batch_analyzer_engine pii.custom_nlp_engine pii.recognizers pii.recognizers.address_recognizer pipeline pipeline.pipeline s services services.conversation_formatter services.model_client services.nemo_client services.openai_client stages stages.audio stages.audio.common stages.audio.datasets stages.audio.datasets.file_utils stages.audio.datasets.fleurs stages.audio.datasets.fleurs.create_initial_manifest stages.audio.inference stages.audio.inference.asr_nemo stages.audio.io stages.audio.io.convert stages.audio.metrics stages.audio.metrics.get_wer stages.base stages.client_partitioning stages.deduplication stages.deduplication.exact stages.deduplication.exact.identification stages.deduplication.exact.workflow stages.deduplication.fuzzy stages.deduplication.fuzzy.buckets_to_edges stages.deduplication.fuzzy.connected_components stages.deduplication.fuzzy.identify_duplicates stages.deduplication.fuzzy.lsh stages.deduplication.fuzzy.lsh.lsh stages.deduplication.fuzzy.lsh.stage stages.deduplication.fuzzy.minhash stages.deduplication.fuzzy.utils stages.deduplication.fuzzy.workflow stages.deduplication.gpu_utils stages.deduplication.id_generator stages.deduplication.io_utils stages.deduplication.semantic stages.deduplication.semantic.identify_duplicates stages.deduplication.semantic.kmeans stages.deduplication.semantic.pairwise stages.deduplication.semantic.pairwise_io stages.deduplication.semantic.ranking stages.deduplication.semantic.utils stages.deduplication.semantic.workflow stages.deduplication.shuffle_utils stages.deduplication.shuffle_utils.rapidsmpf_shuffler stages.deduplication.shuffle_utils.stage stages.file_partitioning stages.function_decorators stages.image stages.image.deduplication stages.image.deduplication.removal stages.image.embedders stages.image.embedders.clip_embedder stages.image.filters stages.image.filters.aesthetic_filter stages.image.filters.base stages.image.filters.nsfw_filter stages.image.io stages.image.io.convert stages.image.io.image_reader stages.image.io.image_writer stages.resources stages.synthetic stages.synthetic.nemotron_cc stages.synthetic.nemotron_cc.base stages.synthetic.nemotron_cc.nemotron_cc stages.synthetic.nemotron_cc.prompts stages.synthetic.qa_multilingual_synthetic stages.text stages.text.classifiers stages.text.classifiers.aegis stages.text.classifiers.aegis_utils stages.text.classifiers.base stages.text.classifiers.constants stages.text.classifiers.content_type stages.text.classifiers.domain stages.text.classifiers.fineweb_edu stages.text.classifiers.prompt_task_complexity stages.text.classifiers.quality stages.text.deduplication stages.text.deduplication.removal stages.text.deduplication.removal_workflow stages.text.deduplication.semantic stages.text.download stages.text.download.arxiv stages.text.download.arxiv.download stages.text.download.arxiv.extract stages.text.download.arxiv.iterator stages.text.download.arxiv.stage stages.text.download.arxiv.url_generation stages.text.download.base stages.text.download.base.download stages.text.download.base.extract stages.text.download.base.iterator stages.text.download.base.stage stages.text.download.base.url_generation stages.text.download.common_crawl stages.text.download.common_crawl.download stages.text.download.common_crawl.extract stages.text.download.common_crawl.stage stages.text.download.common_crawl.url_generation stages.text.download.common_crawl.warc_iterator stages.text.download.html_extractors stages.text.download.html_extractors.base stages.text.download.html_extractors.justext stages.text.download.html_extractors.resiliparse stages.text.download.html_extractors.trafilatura stages.text.download.html_extractors.utils stages.text.download.html_extractors.utils.ja_stopwords stages.text.download.html_extractors.utils.th_stopwords stages.text.download.html_extractors.utils.zh_stopwords stages.text.download.utils stages.text.download.wikipedia stages.text.download.wikipedia.download stages.text.download.wikipedia.extract stages.text.download.wikipedia.iterator stages.text.download.wikipedia.stage stages.text.download.wikipedia.url_generation stages.text.embedders stages.text.embedders.base stages.text.embedders.utils stages.text.filters stages.text.filters.code stages.text.filters.doc_filter stages.text.filters.fasttext_filter stages.text.filters.heuristic_filter stages.text.io stages.text.io.reader stages.text.io.reader.base stages.text.io.reader.jsonl stages.text.io.reader.parquet stages.text.io.writer stages.text.io.writer.base stages.text.io.writer.jsonl stages.text.io.writer.megatron_tokenizer stages.text.io.writer.parquet stages.text.io.writer.utils stages.text.models stages.text.models.model stages.text.models.tokenizer stages.text.models.utils stages.text.modifiers stages.text.modifiers.c4 stages.text.modifiers.doc_modifier stages.text.modifiers.fasttext stages.text.modifiers.line_remover stages.text.modifiers.markdown_remover stages.text.modifiers.newline_normalizer stages.text.modifiers.quotation_remover stages.text.modifiers.slicer stages.text.modifiers.unicode_reformatter stages.text.modifiers.url_remover stages.text.modules stages.text.modules.add_id stages.text.modules.joiner stages.text.modules.modifier stages.text.modules.score_filter stages.text.modules.splitter stages.text.utils stages.text.utils.constants stages.text.utils.text_utils stages.video stages.video.caption stages.video.caption.caption_enhancement stages.video.caption.caption_generation stages.video.caption.caption_preparation stages.video.clipping stages.video.clipping.clip_extraction_stages stages.video.clipping.clip_frame_extraction stages.video.clipping.transnetv2_extraction stages.video.clipping.video_frame_extraction stages.video.embedding stages.video.embedding.cosmos_embed1 stages.video.filtering stages.video.filtering.clip_aesthetic_filter stages.video.filtering.motion_filter stages.video.filtering.motion_vector_backend stages.video.io stages.video.io.clip_writer stages.video.io.video_reader stages.video.preview stages.video.preview.preview synthetic synthetic.async_nemotron synthetic.async_nemotron_cc synthetic.error synthetic.generator synthetic.mixtral synthetic.nemotron synthetic.nemotron_cc synthetic.no_format synthetic.prompts t tasks tasks.audio_batch tasks.document tasks.file_group tasks.image tasks.tasks tasks.utils tasks.video u utils utils.client_utils utils.column_utils utils.decoder_utils utils.file_utils utils.grouping utils.hf_download_utils utils.nvcodec_utils utils.operation_utils utils.performance_utils utils.split_large_files utils.storage_utils utils.windowing_utils utils.writer_utils