synthetic.async_nemotron_cc

Module Contents

Classes

API

class synthetic.async_nemotron_cc.AsyncNemotronCCGenerator(
llm_client: nemo_curator.services.AsyncLLMClient,
)

Initialization

async distill(
document: str,
model: str,
prompt_template: str = DISTILL_PROMPT_TEMPLATE,
system_prompt: str = NEMOTRON_CC_DISTILL_SYSTEM_PROMPT,
prompt_kwargs: dict | None = None,
model_kwargs: dict | None = None,
) -> list[str]

async extract_knowledge(
document: str,
model: str,
prompt_template: str = EXTRACT_KNOWLEDGE_PROMPT_TEMPLATE,
system_prompt: str = NEMOTRON_CC_SYSTEM_PROMPT,
prompt_kwargs: dict | None = None,
model_kwargs: dict | None = None,
) -> list[str]

async generate_diverse_qa(
document: str,
model: str,
prompt_template: str = DIVERSE_QA_PROMPT_TEMPLATE,
system_prompt: str = NEMOTRON_CC_SYSTEM_PROMPT,
prompt_kwargs: dict | None = None,
model_kwargs: dict | None = None,
) -> list[str]

async generate_knowledge_list(
document: str,
model: str,
prompt_template: str = KNOWLEDGE_LIST_PROMPT_TEMPLATE,
system_prompt: str = NEMOTRON_CC_SYSTEM_PROMPT,
prompt_kwargs: dict | None = None,
model_kwargs: dict | None = None,
) -> list[str]

async rewrite_to_wikipedia_style(
document: str,
model: str,
prompt_template: str = WIKIPEDIA_REPHRASING_PROMPT_TEMPLATE,
system_prompt: str = NEMOTRON_CC_SYSTEM_PROMPT,
prompt_kwargs: dict | None = None,
model_kwargs: dict | None = None,
) -> list[str]