bridge.models.glm_vl.glm_45v_provider#

Module Contents#

Classes#

GLM45VModelProvider

Base model provider for GLM 4.5 Vision-Language (VL) Models.

API#

class bridge.models.glm_vl.glm_45v_provider.GLM45VModelProvider#

Bases: megatron.bridge.models.GLM45AirModelProvider106B

Base model provider for GLM 4.5 Vision-Language (VL) Models.

scatter_embedding_sequence_parallel: bool#

False

position_embedding_type: str#

'mrope'

mrope_section: List[int]#

‘field(…)’

vision_config: transformers.models.glm4v.configuration_glm4v.Glm4vVisionConfig#

‘field(…)’

eos_token_id: int#

151329

image_start_token_id: int#

151339

image_end_token_id: int#

151340

video_start_token_id: int#

151341

video_end_token_id: int#

151342

image_token_id: int#

151363

video_token_id: int#

151364

freeze_language_model: bool#

False

freeze_vision_model: bool#

False

freeze_vision_projection: bool#

False

provide(
pre_process=None,
post_process=None,
vp_stage=None,
) → bridge.models.glm_vl.modeling_glm_45v.GLM45VModel#
provide_language_model(
pre_process=None,
post_process=None,
vp_stage=None,
) → megatron.core.models.gpt.GPTModel#