nemo_curator.stages.video.caption.caption_preparation

View as Markdown

Module Contents

Classes

| Name | Description |
| --- | --- |
| CaptionPreparationStage | Stage that prepares captions for video processing. |

Functions

| Name | Description |
| --- | --- |
| _get_prompt | - |

Data

_ENHANCE_PROMPTS

_PROMPTS

API

class nemo_curator.stages.video.caption.caption_preparation.CaptionPreparationStage(
model_variant: str = 'qwen',
prompt_variant: str = 'default',
prompt_text: str | None = None,
verbose: bool = False,
sampling_fps: float = 2.0,
window_size: int = 256,
remainder_threshold: int = 128,
model_does_preprocess: bool = False,
preprocess_dtype: str = 'float32',
generate_previews: bool = True,
name: str = 'caption_preparation'
)
Dataclass

Bases: ProcessingStage[VideoTask, VideoTask]

Stage that prepares captions for video processing.

generate_previews
bool = True
model_does_preprocess
bool = False
model_variant
str = 'qwen'
name
str = 'caption_preparation'
preprocess_dtype
str = 'float32'
prompt_text
str | None = None
prompt_variant
str = 'default'
remainder_threshold
int = 128
sampling_fps
float = 2.0
verbose
bool = False
window_size
int = 256
nemo_curator.stages.video.caption.caption_preparation.CaptionPreparationStage.inputs() -> tuple[list[str], list[str]]
nemo_curator.stages.video.caption.caption_preparation.CaptionPreparationStage.outputs() -> tuple[list[str], list[str]]
nemo_curator.stages.video.caption.caption_preparation.CaptionPreparationStage.process(
task: nemo_curator.tasks.video.VideoTask
) -> nemo_curator.tasks.video.VideoTask
nemo_curator.stages.video.caption.caption_preparation.CaptionPreparationStage.setup(
worker_metadata: nemo_curator.backends.base.WorkerMetadata | None = None
) -> None
nemo_curator.stages.video.caption.caption_preparation._get_prompt(
prompt_variant: str,
prompt_text: str | None
) -> str
nemo_curator.stages.video.caption.caption_preparation._ENHANCE_PROMPTS = {'default': '\n You are a chatbot that enhances video caption inputs, add...
nemo_curator.stages.video.caption.caption_preparation._PROMPTS = {'default': '\n Elaborate on the visual and narrative elements of the vid...