Python Module Index

c
 
c
core
    core.activations
    core.config
    core.config_logger
    core.datasets
    core.datasets.bert_dataset
    core.datasets.blended_dataset
    core.datasets.blended_megatron_dataset_builder
    core.datasets.blended_megatron_dataset_config
    core.datasets.gpt_dataset
    core.datasets.helpers
    core.datasets.indexed_dataset
    core.datasets.masked_dataset
    core.datasets.megatron_dataset
    core.datasets.megatron_tokenizer
    core.datasets.multimodal_dataset
    core.datasets.object_storage_utils
    core.datasets.retro
    core.datasets.retro.config
    core.datasets.retro.config.bert_embedders
    core.datasets.retro.config.config
    core.datasets.retro.config.gpt_chunk_datasets
    core.datasets.retro.config.tokenizers
    core.datasets.retro.db
    core.datasets.retro.db.build
    core.datasets.retro.db.dataset
    core.datasets.retro.db.utils
    core.datasets.retro.external_libs
    core.datasets.retro.index
    core.datasets.retro.index.build
    core.datasets.retro.index.factory
    core.datasets.retro.index.index
    core.datasets.retro.index.indexes
    core.datasets.retro.index.indexes.faiss_base
    core.datasets.retro.index.indexes.faiss_par_add
    core.datasets.retro.index.utils
    core.datasets.retro.index.validate
    core.datasets.retro.query
    core.datasets.retro.query.gpt_chunk_dataset
    core.datasets.retro.query.multi_split_gpt_dataset
    core.datasets.retro.query.query
    core.datasets.retro.query.retro_dataset
    core.datasets.retro.query.utils
    core.datasets.retro.utils
    core.datasets.t5_dataset
    core.datasets.utils
    core.datasets.utils_s3
    core.dist_checkpointing
    core.dist_checkpointing.core
    core.dist_checkpointing.dict_utils
    core.dist_checkpointing.exchange_utils
    core.dist_checkpointing.mapping
    core.dist_checkpointing.optimizer
    core.dist_checkpointing.serialization
    core.dist_checkpointing.state_dict_utils
    core.dist_checkpointing.strategies
    core.dist_checkpointing.strategies.async_utils
    core.dist_checkpointing.strategies.base
    core.dist_checkpointing.strategies.cached_metadata_filesystem_reader
    core.dist_checkpointing.strategies.checkpointable
    core.dist_checkpointing.strategies.common
    core.dist_checkpointing.strategies.filesystem_async
    core.dist_checkpointing.strategies.fully_parallel
    core.dist_checkpointing.strategies.state_dict_saver
    core.dist_checkpointing.strategies.tensorstore
    core.dist_checkpointing.strategies.torch
    core.dist_checkpointing.strategies.two_stage
    core.dist_checkpointing.strategies.zarr
    core.dist_checkpointing.tensor_aware_state_dict
    core.dist_checkpointing.utils
    core.dist_checkpointing.validation
    core.distributed
    core.distributed.data_parallel_base
    core.distributed.distributed_data_parallel
    core.distributed.distributed_data_parallel_config
    core.distributed.finalize_model_grads
    core.distributed.fsdp
    core.distributed.fsdp.mcore_fsdp_adapter
    core.distributed.fsdp.src
    core.distributed.fsdp.src.megatron_fsdp
    core.distributed.fsdp.src.megatron_fsdp.distributed_data_parallel_config
    core.distributed.fsdp.src.megatron_fsdp.fully_shard
    core.distributed.fsdp.src.megatron_fsdp.megatron_fsdp
    core.distributed.fsdp.src.megatron_fsdp.package_info
    core.distributed.fsdp.src.megatron_fsdp.param_and_grad_buffer
    core.distributed.fsdp.src.megatron_fsdp.uneven_dtensor
    core.distributed.fsdp.src.megatron_fsdp.utils
    core.distributed.param_and_grad_buffer
    core.distributed.reduce_scatter_with_fp32_accumulation
    core.distributed.torch_fully_sharded_data_parallel
    core.distributed.torch_fully_sharded_data_parallel_config
    core.energy_monitor
    core.enums
    core.export
    core.export.data_type
    core.export.export_config
    core.export.model_type
    core.export.trtllm
    core.export.trtllm.engine_builder
    core.export.trtllm.engine_builder.trtllm_engine_builder
    core.export.trtllm.model_to_trllm_mapping
    core.export.trtllm.model_to_trllm_mapping.default_conversion_dict
    core.export.trtllm.trt_model_config
    core.export.trtllm.trt_model_type
    core.export.trtllm.trtllm_helper
    core.export.trtllm.trtllm_layers
    core.export.trtllm.trtllm_weights_converter
    core.export.trtllm.trtllm_weights_converter.distributed_trtllm_model_weights_converter
    core.export.trtllm.trtllm_weights_converter.single_device_trtllm_model_weights_converter
    core.export.trtllm.trtllm_weights_converter.utils
    core.extensions
    core.extensions.kitchen
    core.extensions.transformer_engine
    core.extensions.transformer_engine_spec_provider
    core.fp4_utils
    core.fp8_utils
    core.full_cuda_graph
    core.fusions
    core.fusions.fused_bias_dropout
    core.fusions.fused_bias_geglu
    core.fusions.fused_bias_gelu
    core.fusions.fused_bias_swiglu
    core.fusions.fused_cross_entropy
    core.fusions.fused_indices_converter
    core.fusions.fused_layer_norm
    core.fusions.fused_mla_yarn_rope_apply
    core.fusions.fused_pad_routing_map
    core.fusions.fused_softmax
    core.fusions.fused_weighted_squared_relu
    core.hyper_comm_grid
    core.inference
    core.inference.async_stream
    core.inference.batch_dimensions_utils
    core.inference.common_inference_params
    core.inference.communication_utils
    core.inference.contexts
    core.inference.contexts.base_context
    core.inference.contexts.dynamic_block_allocator
    core.inference.contexts.dynamic_context
    core.inference.contexts.fused_kv_append_kernel
    core.inference.contexts.static_context
    core.inference.data_parallel_inference_coordinator
    core.inference.engines
    core.inference.engines.abstract_engine
    core.inference.engines.async_zmq_communicator
    core.inference.engines.dynamic_engine
    core.inference.engines.mcore_engine
    core.inference.engines.static_engine
    core.inference.headers
    core.inference.inference_client
    core.inference.inference_request
    core.inference.model_inference_wrappers
    core.inference.model_inference_wrappers.abstract_model_inference_wrapper
    core.inference.model_inference_wrappers.gpt
    core.inference.model_inference_wrappers.gpt.gpt_inference_wrapper
    core.inference.model_inference_wrappers.inference_wrapper_config
    core.inference.model_inference_wrappers.t5
    core.inference.model_inference_wrappers.t5.t5_inference_wrapper
    core.inference.sampling_params
    core.inference.scheduler
    core.inference.text_generation_controllers
    core.inference.text_generation_controllers.encoder_decoder_text_generation_controller
    core.inference.text_generation_controllers.simple_text_generation_controller
    core.inference.text_generation_controllers.text_generation_controller
    core.inference.text_generation_controllers.vlm_text_generation_controller
    core.inference.text_generation_server
    core.inference.text_generation_server.run_mcore_engine
    core.inference.text_generation_server.text_generation_server
    core.inference.text_generation_server.tokenization
    core.inference.unified_memory
    core.inference.utils
    core.inference_params
    core.jit
    core.model_parallel_config
    core.models
    core.models.backends
    core.models.bert
    core.models.bert.bert_layer_specs
    core.models.bert.bert_lm_head
    core.models.bert.bert_model
    core.models.bert.pooler
    core.models.common
    core.models.common.embeddings
    core.models.common.embeddings.language_model_embedding
    core.models.common.embeddings.relative_pos_embedding
    core.models.common.embeddings.rope_utils
    core.models.common.embeddings.rotary_pos_embedding
    core.models.common.embeddings.yarn_rotary_pos_embedding
    core.models.common.language_module
    core.models.common.language_module.language_module
    core.models.common.model_chunk_schedule_plan
    core.models.common.vision_module
    core.models.common.vision_module.vision_module
    core.models.gpt
    core.models.gpt.fine_grained_callables
    core.models.gpt.gpt_layer_specs
    core.models.gpt.gpt_model
    core.models.gpt.moe_module_specs
    core.models.huggingface
    core.models.huggingface.clip_model
    core.models.huggingface.module
    core.models.huggingface.qwen_model
    core.models.mamba
    core.models.mamba.mamba_layer_specs
    core.models.mamba.mamba_model
    core.models.mimo
    core.models.mimo.config
    core.models.mimo.config.base_configs
    core.models.mimo.model
    core.models.mimo.model.base
    core.models.multimodal
    core.models.multimodal.context_parallel
    core.models.multimodal.llava_model
    core.models.multimodal.llava_spec
    core.models.retro
    core.models.retro.base_attention
    core.models.retro.config
    core.models.retro.decoder_attention
    core.models.retro.decoder_spec
    core.models.retro.encoder_attention
    core.models.retro.encoder_spec
    core.models.retro.model
    core.models.retro.utils
    core.models.T5
    core.models.T5.t5_model
    core.models.T5.t5_spec
    core.models.vision
    core.models.vision.clip_vit_model
    core.models.vision.multimodal_projector
    core.models.vision.radio
    core.models.vision.vit_layer_specs
    core.msc_utils
    core.nccl_allocator
    core.num_microbatches_calculator
    core.optimizer
    core.optimizer.clip_grads
    core.optimizer.cpu_offloading
    core.optimizer.cpu_offloading.hybrid_optimizer
    core.optimizer.distrib_optimizer
    core.optimizer.grad_scaler
    core.optimizer.optimizer
    core.optimizer.optimizer_config
    core.optimizer.qk_clip
    core.optimizer_param_scheduler
    core.package_info
    core.packed_seq_params
    core.parallel_state
    core.pipeline_parallel
    core.pipeline_parallel.bridge_communicator
    core.pipeline_parallel.combined_1f1b
    core.pipeline_parallel.p2p_communication
    core.pipeline_parallel.schedules
    core.pipeline_parallel.utils
    core.post_training
    core.post_training.modelopt
    core.post_training.modelopt.gpt
    core.post_training.modelopt.gpt.model_specs
    core.post_training.modelopt.gpt.state_dict_hooks
    core.post_training.modelopt.layers
    core.post_training.modelopt.mamba
    core.post_training.modelopt.mamba.model_specs
    core.process_groups_config
    core.quantization
    core.quantization.quant_config
    core.quantization.utils
    core.rerun_state_machine
    core.safe_globals
    core.ssm
    core.ssm.mamba_block
    core.ssm.mamba_context_parallel
    core.ssm.mamba_hybrid_layer_allocation
    core.ssm.mamba_layer
    core.ssm.mamba_mixer
    core.ssm.mlp_layer
    core.ssm.triton_cache_manager
    core.tensor_parallel
    core.tensor_parallel.cross_entropy
    core.tensor_parallel.data
    core.tensor_parallel.inference_layers
    core.tensor_parallel.layers
    core.tensor_parallel.mappings
    core.tensor_parallel.random
    core.tensor_parallel.utils
    core.timers
    core.tokenizers
    core.tokenizers.base_tokenizer
    core.tokenizers.megatron_tokenizer
    core.tokenizers.text
    core.tokenizers.text.libraries
    core.tokenizers.text.libraries.abstract_tokenizer
    core.tokenizers.text.libraries.bytelevel_tokenizer
    core.tokenizers.text.libraries.chat_template
    core.tokenizers.text.libraries.huggingface_tokenizer
    core.tokenizers.text.libraries.megatron_hf_tokenizer
    core.tokenizers.text.libraries.null_tokenizer
    core.tokenizers.text.libraries.sentencepiece_tokenizer
    core.tokenizers.text.libraries.tiktoken_tokenizer
    core.tokenizers.text.models
    core.tokenizers.text.models.bert_tokenizer
    core.tokenizers.text.models.default_tokenizer
    core.tokenizers.text.models.gpt_tokenizer
    core.tokenizers.text.models.mamba_tokenizer
    core.tokenizers.text.models.retro_tokenizer
    core.tokenizers.text.models.t5_tokenizer
    core.tokenizers.text.text_tokenizer
    core.transformer
    core.transformer.attention
    core.transformer.cuda_graphs
    core.transformer.custom_layers
    core.transformer.custom_layers.batch_invariant_kernels
    core.transformer.custom_layers.transformer_engine
    core.transformer.dot_product_attention
    core.transformer.enums
    core.transformer.fsdp_dtensor_checkpoint
    core.transformer.identity_op
    core.transformer.mlp
    core.transformer.module
    core.transformer.moe
    core.transformer.moe.experts
    core.transformer.moe.fused_a2a
    core.transformer.moe.grouped_gemm_util
    core.transformer.moe.moe_layer
    core.transformer.moe.moe_utils
    core.transformer.moe.router
    core.transformer.moe.shared_experts
    core.transformer.moe.token_dispatcher
    core.transformer.moe.upcycling_utils
    core.transformer.multi_latent_attention
    core.transformer.multi_token_prediction
    core.transformer.pipeline_parallel_layer_layout
    core.transformer.spec_utils
    core.transformer.torch_layer_norm
    core.transformer.torch_norm
    core.transformer.transformer_block
    core.transformer.transformer_config
    core.transformer.transformer_layer
    core.transformer.utils
    core.utils