# core.transformer
## Subpackages
- core.transformer.moe
- core.transformer.moe.shared_experts
- core.transformer.moe.router_replay
- core.transformer.moe.fused_a2a
- core.transformer.moe.moe_utils
- core.transformer.moe.upcycling_utils
- core.transformer.moe.token_dispatcher
- core.transformer.moe.experts
- core.transformer.moe.router
- core.transformer.moe.moe_layer
- core.transformer.moe.grouped_gemm_util
- core.transformer.custom_layers
## Submodules
- core.transformer.attention
- core.transformer.transformer_layer
- core.transformer.multi_latent_attention
- core.transformer.transformer_config
- core.transformer.torch_norm
- core.transformer.transformer_block
- core.transformer.torch_layer_norm
- core.transformer.pipeline_parallel_layer_layout
- core.transformer.module
- core.transformer.fsdp_dtensor_checkpoint
- core.transformer.utils
- core.transformer.spec_utils
- core.transformer.mlp
- core.transformer.dot_product_attention
- core.transformer.multi_token_prediction
- core.transformer.enums
- core.transformer.cuda_graphs
- core.transformer.identity_op