core.transformer#
Subpackages#
core.transformer.moe
    core.transformer.moe.shared_experts
    core.transformer.moe.router
    core.transformer.moe.moe_utils
    core.transformer.moe.upcycling_utils
    core.transformer.moe.moe_layer
    core.transformer.moe.grouped_gemm_util
    core.transformer.moe.router_replay
    core.transformer.moe.experts
    core.transformer.moe.fused_a2a
    core.transformer.moe.token_dispatcher
core.transformer.custom_layers
Submodules#
core.transformer.torch_layer_norm
core.transformer.transformer_layer
core.transformer.multi_token_prediction
core.transformer.module
core.transformer.mlp
core.transformer.transformer_block
core.transformer.identity_op
core.transformer.multi_latent_attention
core.transformer.pipeline_parallel_layer_layout
core.transformer.attention
core.transformer.fsdp_dtensor_checkpoint
core.transformer.enums
core.transformer.spec_utils
core.transformer.transformer_config
core.transformer.cuda_graphs
core.transformer.torch_norm
core.transformer.dot_product_attention
core.transformer.utils