nemo_rl.experience.interfaces

Module Contents

Classes

Completion

A single generated completion for one prompt.

PromptGroupRecord

All completions for a single prompt, with prompt-level metadata.

API

class nemo_rl.experience.interfaces.Completion

A single generated completion for one prompt.

message_log: nemo_rl.data.interfaces.LLMMessageLogType | nemo_rl.data.interfaces.VLMMessageLogType

None

env_extras: Optional[dict[str, Any]]

None

truncated: bool

None

reward: float

None

class nemo_rl.experience.interfaces.PromptGroupRecord

All completions for a single prompt, with prompt-level metadata.

prompt_idx: int

None

prompt: nemo_rl.data.interfaces.LLMMessageLogType | nemo_rl.data.interfaces.VLMMessageLogType

None

extra_env_info: Optional[dict[str, Any]]

None

metadata: dict[str, Any]

None

completions: list[nemo_rl.experience.interfaces.Completion]

None

rollout_metrics: dict[str, Any]

None