nemo_rl.data#
Subpackages#
nemo_rl.data.eval_datasets
nemo_rl.data.hf_datasets
nemo_rl.data.hf_datasets.chat_templates
nemo_rl.data.hf_datasets.openmathinstruct2
nemo_rl.data.hf_datasets.helpsteer3
nemo_rl.data.hf_datasets.squad
nemo_rl.data.hf_datasets.prompt_response_dataset
nemo_rl.data.hf_datasets.dpo
nemo_rl.data.hf_datasets.deepscaler
nemo_rl.data.hf_datasets.oasst
nemo_rl.data.hf_datasets.oai_format_dataset
nemo_rl.data.packing
Submodules#
Package Contents#
Classes#
API#
- class nemo_rl.data.DataConfig[source]#
Bases: typing.TypedDict
- max_input_seq_length: int#
None
- prompt_file: NotRequired[str]#
None
- system_prompt_file: NotRequired[str]#
None
- dataset_name: str#
None
- val_dataset_name: NotRequired[str]#
None
- add_bos: NotRequired[bool]#
None
- add_eos: NotRequired[bool]#
None
- input_key: NotRequired[str]#
None
- output_key: NotRequired[str]#
None
- add_generation_prompt: NotRequired[bool]#
None
- add_system_prompt: NotRequired[bool]#
None
- split: NotRequired[str]#
None
- class nemo_rl.data.MathDataConfig[source]#
Bases: nemo_rl.data.DataConfig
- problem_key: str#
None
- solution_key: str#
None