nemo_curator.stages.video.embedding.cosmos_embed1

View as Markdown

Module Contents

Classes

| Name | Description |
| --- | --- |
| CosmosEmbed1EmbeddingStage | Stage for embedding Cosmos-Embed1 frames into a vector space. |
| CosmosEmbed1FrameCreationStage | Stage for creating Cosmos-Embed1 input frames from video clips. |

API

class nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1EmbeddingStage(
model_dir: str = 'models/cosmos_embed1',
variant: typing.Literal['224p', '336p', '448p'] = '336p',
texts_to_verify: list[str] | None = None,
gpu_memory_gb: int = 20,
verbose: bool = False,
name: str = 'cosmos_embed1_embedding'
)
Dataclass

Bases: ProcessingStage[VideoTask, VideoTask]

Stage for embedding Cosmos-Embed1 frames into a vector space.

This class processes video clips through a series of steps including frame extraction, model initialization, and input frame creation.

gpu_memory_gb
int = 20
model_dir
str = 'models/cosmos_embed1'
name
str = 'cosmos_embed1_embedding'
texts_to_verify
list[str] | None = None
variant
Literal['224p', '336p', '448p'] = '336p'
verbose
bool = False
nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1EmbeddingStage.__post_init__() -> None
nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1EmbeddingStage.inputs() -> tuple[list[str], list[str]]
nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1EmbeddingStage.outputs() -> tuple[list[str], list[str]]
nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1EmbeddingStage.process(
task: nemo_curator.tasks.video.VideoTask
) -> nemo_curator.tasks.video.VideoTask
nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1EmbeddingStage.setup(
worker_metadata: nemo_curator.backends.base.WorkerMetadata | None = None
) -> None
nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1EmbeddingStage.setup_on_node(
node_info: nemo_curator.backends.base.NodeInfo,
worker_metadata: nemo_curator.backends.base.WorkerMetadata
) -> None

Download the weights for the CosmosEmbed1 model on the node.

class nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1FrameCreationStage(
model_dir: str = 'models/cosmos_embed1',
variant: typing.Literal['224p', '336p', '448p'] = '336p',
target_fps: float = 2.0,
verbose: bool = False,
num_cpus: int = 3,
name: str = 'cosmos_embed1'
)
Dataclass

Bases: ProcessingStage[VideoTask, VideoTask]

Stage for creating Cosmos-Embed1 input frames from video clips.

This class processes video clips through a series of steps including frame extraction, model initialization, and input frame creation.

model_dir
str = 'models/cosmos_embed1'
name
str = 'cosmos_embed1'
num_cpus
int = 3
target_fps
float = 2.0
variant
Literal['224p', '336p', '448p'] = '336p'
verbose
bool = False
nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1FrameCreationStage.inputs() -> tuple[list[str], list[str]]
nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1FrameCreationStage.outputs() -> tuple[list[str], list[str]]
nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1FrameCreationStage.process(
task: nemo_curator.tasks.video.VideoTask
) -> nemo_curator.tasks.video.VideoTask
nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1FrameCreationStage.setup(
worker_metadata: nemo_curator.backends.base.WorkerMetadata | None = None
) -> None
nemo_curator.stages.video.embedding.cosmos_embed1.CosmosEmbed1FrameCreationStage.setup_on_node(
node_info: nemo_curator.backends.base.NodeInfo,
worker_metadata: nemo_curator.backends.base.WorkerMetadata
) -> None

Download the weights for the CosmosEmbed1 model on the node.