nemo_microservices.types.deployment.model_deployment_create_params#

Module Contents#

Classes#

Data#

API#

nemo_microservices.types.deployment.model_deployment_create_params.Config: typing_extensions.TypeAlias#

None

class nemo_microservices.types.deployment.model_deployment_create_params.ModelDeploymentCreateParams#

Bases: typing_extensions.TypedDict

async_enabled: bool#

None

Whether the async mode is enabled.

config: typing_extensions.Required[Config]#

None

The deployment configuration.

custom_fields: Dict[str, object]#

None

A set of custom fields that the user can define and use for various purposes.

description: str#

None

The description of the entity.

hf_token: str#

None

Hugging Face authentication token for accessing private models and repositories. This token will be stored as a Kubernetes secret and mounted as an environment variable (HF_TOKEN) in the NIM deployment. The secret will be automatically cleaned up when the model deployment is deleted.

models: nemo_microservices._types.SequenceNotStr[str]#

None

The models served by this deployment.

name: str#

None

The name of the entity.

Must be unique inside the namespace. If not specified, it will be the same as the automatically generated id.

namespace: str#

None

The id of the namespace of the entity.

This can be missing for namespace entities or in deployments that don’t use namespaces.

ownership: nemo_microservices.types.shared_params.ownership.Ownership#

None

Information about ownership of an entity.

If the entity is a namespace, the access_policies will typically apply to all entities inside the namespace.

project: str#

None

The id of the project associated with this entity.