nemo_rl.models.generation.vllm.config
Module Contents
Classes
API
- class nemo_rl.models.generation.vllm.config.VllmSpecificArgs
Bases: typing.TypedDict
- tensor_parallel_size: int
None
- pipeline_parallel_size: int
None
- gpu_memory_utilization: float
None
- max_model_len: int
None
- skip_tokenizer_init: bool
None
- async_engine: bool
None
- load_format: NotRequired[str]
None
- precision: NotRequired[str]
None
- enforce_eager: NotRequired[bool]
None
- class nemo_rl.models.generation.vllm.config.VllmConfig
Bases: nemo_rl.models.generation.interfaces.GenerationConfig
- vllm_cfg: nemo_rl.models.generation.vllm.config.VllmSpecificArgs
None
- vllm_kwargs: NotRequired[dict[str, Any]]
None