# core.inference
## Subpackages
- core.inference.text_generation_controllers
  - core.inference.text_generation_controllers.encoder_decoder_text_generation_controller
  - core.inference.text_generation_controllers.mtp_utils_pytorch
  - core.inference.text_generation_controllers.mtp_utils_triton
  - core.inference.text_generation_controllers.text_generation_controller
  - core.inference.text_generation_controllers.vlm_text_generation_controller
- core.inference.contexts
  - core.inference.contexts.mamba_slot_allocator
  - core.inference.contexts.kv_block_allocator
  - core.inference.contexts.dynamic_context
  - core.inference.contexts.routing_metadata
  - core.inference.contexts.gpu_view
  - core.inference.contexts.fused_kv_append_kernel
  - core.inference.contexts.base_context
  - core.inference.contexts.static_context
- core.inference.engines
- core.inference.moe
- core.inference.sampling
- core.inference.text_generation_server
- core.inference.model_inference_wrappers
- core.inference.quantization
- core.inference.apis
## Submodules
- core.inference.symmetric_memory
- core.inference.communication_utils
- core.inference.async_stream
- core.inference.config
- core.inference.unified_memory
- core.inference.utils
- core.inference.batch_dimensions_utils
- core.inference.inference_client
- core.inference.sampling_params
- core.inference.common_inference_params
- core.inference.scheduler
- core.inference.data_parallel_inference_coordinator
- core.inference.headers
- core.inference.inference_request