nemo_microservices.resources.v2.inference.deployments.versions#

Module Contents#

Classes#

API#

class nemo_microservices.resources.v2.inference.deployments.versions.AsyncVersionsResource(
client: nemo_microservices._client.AsyncNeMoMicroservices,
)#

Bases: nemo_microservices._resource.AsyncAPIResource

Initialization

async delete(
version: str,
*,
namespace: str,
deployment_name: str,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) object#

Delete a specific version of a ModelDeployment.

If the deployment is in any state other than DELETED, this will set its status to DELETING. The models controller will then:

  1. Delete the infrastructure (e.g., K8s NimService)

  2. Update the status to DELETED

If the deployment is already in DELETED status, calling delete again will permanently remove it from the database.

Returns:

  • 202 Accepted: Deployment version marked for deletion (status set to DELETING)

  • 204 No Content: Deployment version permanently removed from database (was already DELETED)

  • 404 Not Found: Deployment version doesn’t exist

Args:

  • extra_headers: Send extra headers

  • extra_query: Add additional query parameters to the request

  • extra_body: Add additional JSON properties to the request

  • timeout: Override the client-level default timeout for this request, in seconds

async list(
deployment_name: str,
*,
namespace: str,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) nemo_microservices.types.v2.inference.deployments.version_list_response.VersionListResponse#

List all versions of a ModelDeployment.

Args:

  • extra_headers: Send extra headers

  • extra_query: Add additional query parameters to the request

  • extra_body: Add additional JSON properties to the request

  • timeout: Override the client-level default timeout for this request, in seconds

async retrieve(
version: str,
*,
namespace: str,
deployment_name: str,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) nemo_microservices.types.v2.inference.model_deployment.ModelDeployment#

Get a specific version of a ModelDeployment.

Args:

  • extra_headers: Send extra headers

  • extra_query: Add additional query parameters to the request

  • extra_body: Add additional JSON properties to the request

  • timeout: Override the client-level default timeout for this request, in seconds

property with_raw_response: nemo_microservices.resources.v2.inference.deployments.versions.AsyncVersionsResourceWithRawResponse#

This property can be used as a prefix for any HTTP method call to return the raw response object instead of the parsed content.

For more information, see https://docs.nvidia.com/nemo/microservices/latest/pysdk/index.html#accessing-raw-response-data-e-g-headers

property with_streaming_response: nemo_microservices.resources.v2.inference.deployments.versions.AsyncVersionsResourceWithStreamingResponse#

An alternative to .with_raw_response that doesn’t eagerly read the response body.

For more information, see https://docs.nvidia.com/nemo/microservices/latest/pysdk/index.html#with_streaming_response

class nemo_microservices.resources.v2.inference.deployments.versions.AsyncVersionsResourceWithRawResponse(
versions: nemo_microservices.resources.v2.inference.deployments.versions.AsyncVersionsResource,
)#

Initialization

class nemo_microservices.resources.v2.inference.deployments.versions.AsyncVersionsResourceWithStreamingResponse(
versions: nemo_microservices.resources.v2.inference.deployments.versions.AsyncVersionsResource,
)#

Initialization

class nemo_microservices.resources.v2.inference.deployments.versions.VersionsResource(client: nemo_microservices._client.NeMoMicroservices)#

Bases: nemo_microservices._resource.SyncAPIResource

Initialization

delete(
version: str,
*,
namespace: str,
deployment_name: str,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) object#

Delete a specific version of a ModelDeployment.

If the deployment is in any state other than DELETED, this will set its status to DELETING. The models controller will then:

  1. Delete the infrastructure (e.g., K8s NimService)

  2. Update the status to DELETED

If the deployment is already in DELETED status, calling delete again will permanently remove it from the database.

Returns:

  • 202 Accepted: Deployment version marked for deletion (status set to DELETING)

  • 204 No Content: Deployment version permanently removed from database (was already DELETED)

  • 404 Not Found: Deployment version doesn’t exist

Args:

  • extra_headers: Send extra headers

  • extra_query: Add additional query parameters to the request

  • extra_body: Add additional JSON properties to the request

  • timeout: Override the client-level default timeout for this request, in seconds

list(
deployment_name: str,
*,
namespace: str,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) nemo_microservices.types.v2.inference.deployments.version_list_response.VersionListResponse#

List all versions of a ModelDeployment.

Args:

  • extra_headers: Send extra headers

  • extra_query: Add additional query parameters to the request

  • extra_body: Add additional JSON properties to the request

  • timeout: Override the client-level default timeout for this request, in seconds

retrieve(
version: str,
*,
namespace: str,
deployment_name: str,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) nemo_microservices.types.v2.inference.model_deployment.ModelDeployment#

Get a specific version of a ModelDeployment.

Args:

  • extra_headers: Send extra headers

  • extra_query: Add additional query parameters to the request

  • extra_body: Add additional JSON properties to the request

  • timeout: Override the client-level default timeout for this request, in seconds

property with_raw_response: nemo_microservices.resources.v2.inference.deployments.versions.VersionsResourceWithRawResponse#

This property can be used as a prefix for any HTTP method call to return the raw response object instead of the parsed content.

For more information, see https://docs.nvidia.com/nemo/microservices/latest/pysdk/index.html#accessing-raw-response-data-e-g-headers

property with_streaming_response: nemo_microservices.resources.v2.inference.deployments.versions.VersionsResourceWithStreamingResponse#

An alternative to .with_raw_response that doesn’t eagerly read the response body.

For more information, see https://docs.nvidia.com/nemo/microservices/latest/pysdk/index.html#with_streaming_response

class nemo_microservices.resources.v2.inference.deployments.versions.VersionsResourceWithRawResponse(
versions: nemo_microservices.resources.v2.inference.deployments.versions.VersionsResource,
)#

Initialization

class nemo_microservices.resources.v2.inference.deployments.versions.VersionsResourceWithStreamingResponse(
versions: nemo_microservices.resources.v2.inference.deployments.versions.VersionsResource,
)#

Initialization