API Reference
This page contains auto-generated API reference documentation [1].
nemo_rl
nemo_rl.data
nemo_rl.data.packing
nemo_rl.data.datasets
nemo_rl.data.datasets.response_datasets
nemo_rl.data.datasets.response_datasets.squad
nemo_rl.data.datasets.response_datasets.response_dataset
nemo_rl.data.datasets.response_datasets.openmathinstruct2
nemo_rl.data.datasets.response_datasets.dapo_math
nemo_rl.data.datasets.response_datasets.oasst
nemo_rl.data.datasets.response_datasets.gsm8k
nemo_rl.data.datasets.response_datasets.oai_format_dataset
nemo_rl.data.datasets.response_datasets.deepscaler
nemo_rl.data.datasets.response_datasets.clevr
nemo_rl.data.datasets.response_datasets.refcoco
nemo_rl.data.datasets.response_datasets.nemogym_dataset
nemo_rl.data.datasets.response_datasets.geometry3k
nemo_rl.data.datasets.response_datasets.tulu3
nemo_rl.data.datasets.response_datasets.aime24
nemo_rl.data.datasets.response_datasets.helpsteer3
nemo_rl.data.datasets.response_datasets.daily_omni
nemo_rl.data.datasets.response_datasets.general_conversations_dataset
nemo_rl.data.datasets.preference_datasets
nemo_rl.data.datasets.eval_datasets
nemo_rl.data.datasets.utils
nemo_rl.data.datasets.processed_dataset
nemo_rl.data.datasets.raw_dataset
nemo_rl.data.dataloader
nemo_rl.data.utils
nemo_rl.data.interfaces
nemo_rl.data.multimodal_utils
nemo_rl.data.processors
nemo_rl.data.collate_fn
nemo_rl.data.chat_templates
nemo_rl.data.llm_message_utils
nemo_rl.algorithms
nemo_rl.algorithms.loss
nemo_rl.algorithms.sft
nemo_rl.algorithms.utils
nemo_rl.algorithms.advantage_estimator
nemo_rl.algorithms.grpo
nemo_rl.algorithms.distillation
nemo_rl.algorithms.async_utils
nemo_rl.algorithms.logits_sampling_utils
nemo_rl.algorithms.rm
nemo_rl.algorithms.reward_functions
nemo_rl.algorithms.dpo
nemo_rl.models
nemo_rl.models.huggingface
nemo_rl.models.dtensor
nemo_rl.models.megatron
nemo_rl.models.policy
nemo_rl.models.automodel
nemo_rl.models.generation
nemo_rl.distributed
nemo_rl.distributed.worker_groups
nemo_rl.distributed.virtual_cluster
nemo_rl.distributed.ray_actor_environment_registry
nemo_rl.distributed.batched_data_dict
nemo_rl.distributed.model_utils
nemo_rl.distributed.named_sharding
nemo_rl.distributed.worker_group_utils
nemo_rl.distributed.stateless_process_group
nemo_rl.distributed.collectives
nemo_rl.evals
nemo_rl.utils
nemo_rl.utils.prefetch_venvs
nemo_rl.utils.packed_tensor
nemo_rl.utils.logger
nemo_rl.utils.venvs
nemo_rl.utils.nsys
nemo_rl.utils.memory_tracker
nemo_rl.utils.flops_tracker
nemo_rl.utils.flops_formulas
nemo_rl.utils.native_checkpoint
nemo_rl.utils.nvml
nemo_rl.utils.config
nemo_rl.utils.timer
nemo_rl.utils.checkpoint
nemo_rl.experience
nemo_rl.environments
nemo_rl.environments.metrics
nemo_rl.environments.utils
nemo_rl.environments.code_environment
nemo_rl.environments.nemo_gym
nemo_rl.environments.code_jaccard_environment
nemo_rl.environments.dapo_math_verifier
nemo_rl.environments.interfaces
nemo_rl.environments.vlm_environment
nemo_rl.environments.math_environment
nemo_rl.environments.rewards
nemo_rl.environments.reward_model_environment
nemo_rl.package_info