nemo_rl.data#
Subpackages#
- nemo_rl.data.packing
- nemo_rl.data.datasets
- nemo_rl.data.datasets.response_datasets
- nemo_rl.data.datasets.response_datasets.refcoco
- nemo_rl.data.datasets.response_datasets.oai_format_dataset
- nemo_rl.data.datasets.response_datasets.squad
- nemo_rl.data.datasets.response_datasets.geometry3k
- nemo_rl.data.datasets.response_datasets.oasst
- nemo_rl.data.datasets.response_datasets.response_dataset
- nemo_rl.data.datasets.response_datasets.openmathinstruct2
- nemo_rl.data.datasets.response_datasets.deepscaler
- nemo_rl.data.datasets.response_datasets.clevr
- nemo_rl.data.datasets.response_datasets.dapo_math
- nemo_rl.data.datasets.eval_datasets
- nemo_rl.data.datasets.preference_datasets
- nemo_rl.data.datasets.utils
- nemo_rl.data.datasets.processed_dataset
Submodules#
Package Contents#
Classes#
API#
- class nemo_rl.data.DataConfig[source]#
Bases: typing.TypedDict
- max_input_seq_length: int#
None
- prompt_file: NotRequired[str]#
None
- system_prompt_file: NotRequired[str]#
None
- dataset_name: str#
None
- val_dataset_name: NotRequired[str]#
None
- add_bos: NotRequired[bool]#
None
- add_eos: NotRequired[bool]#
None
- input_key: NotRequired[str]#
None
- output_key: NotRequired[str]#
None
- add_generation_prompt: NotRequired[bool]#
None
- add_system_prompt: NotRequired[bool]#
None
- split: NotRequired[str]#
None
- shuffle: NotRequired[bool]#
None
- seed: NotRequired[int]#
None
- download_dir: NotRequired[str]#
None
- train_data_path: NotRequired[str]#
None
- val_data_paths: NotRequired[dict[str, str]]#
None
- num_workers: NotRequired[int]#
None
- class nemo_rl.data.MathDataConfig[source]#
Bases: nemo_rl.data.DataConfig
- problem_key: str#
None
- solution_key: str#
None