nemo_microservices.resources.v2.inference.deployments.deployments#

Module Contents#

Classes#

API#

class nemo_microservices.resources.v2.inference.deployments.deployments.AsyncDeploymentsResource(
client: nemo_microservices._client.AsyncNeMoMicroservices,
)#

Bases: nemo_microservices._resource.AsyncAPIResource

Initialization

async create(
*,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) object#

Create ModelDeployment endpoint - returns a simple hello world response for now.

async delete(
deployment_name: str,
*,
namespace: str,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) None#

Delete All ModelDeployment Versions endpoint - returns a simple hello world response for now.

Args:

extra_headers: Send extra headers

extra_query: Add additional query parameters to the request

extra_body: Add additional JSON properties to the request

timeout: Override the client-level default timeout for this request, in seconds

async list(
*,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) object#

List ModelDeployments endpoint - returns a simple hello world response for now. Supports filter parameters for status.

async list_namespace(
namespace: str,
*,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) object#

List ModelDeployments By Namespace endpoint - returns a simple hello world response for now.

Args:

extra_headers: Send extra headers

extra_query: Add additional query parameters to the request

extra_body: Add additional JSON properties to the request

timeout: Override the client-level default timeout for this request, in seconds

property models: nemo_microservices.resources.v2.inference.deployments.models.AsyncModelsResource#
async retrieve(
deployment_name: str,
*,
namespace: str,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) object#

Get Latest ModelDeployment endpoint - returns a simple hello world response for now.

Args:

extra_headers: Send extra headers

extra_query: Add additional query parameters to the request

extra_body: Add additional JSON properties to the request

timeout: Override the client-level default timeout for this request, in seconds

property status: nemo_microservices.resources.v2.inference.deployments.status.AsyncStatusResource#
async update(
deployment_name: str,
*,
namespace: str,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) object#

Update ModelDeployment endpoint - returns a simple hello world response for now.

Args:

extra_headers: Send extra headers

extra_query: Add additional query parameters to the request

extra_body: Add additional JSON properties to the request

timeout: Override the client-level default timeout for this request, in seconds

property versions: nemo_microservices.resources.v2.inference.deployments.versions.AsyncVersionsResource#
property with_raw_response: nemo_microservices.resources.v2.inference.deployments.deployments.AsyncDeploymentsResourceWithRawResponse#

This property can be used as a prefix for any HTTP method call to return the raw response object instead of the parsed content.

For more information, see https://docs.nvidia.com/nemo/microservices/latest/pysdk/index.html#accessing-raw-response-data-e-g-headers

property with_streaming_response: nemo_microservices.resources.v2.inference.deployments.deployments.AsyncDeploymentsResourceWithStreamingResponse#

An alternative to .with_raw_response that doesn’t eagerly read the response body.

For more information, see https://docs.nvidia.com/nemo/microservices/latest/pysdk/index.html#with_streaming_response

class nemo_microservices.resources.v2.inference.deployments.deployments.AsyncDeploymentsResourceWithRawResponse(
deployments: nemo_microservices.resources.v2.inference.deployments.deployments.AsyncDeploymentsResource,
)#

Initialization

property models: nemo_microservices.resources.v2.inference.deployments.models.AsyncModelsResourceWithRawResponse#
property status: nemo_microservices.resources.v2.inference.deployments.status.AsyncStatusResourceWithRawResponse#
property versions: nemo_microservices.resources.v2.inference.deployments.versions.AsyncVersionsResourceWithRawResponse#
class nemo_microservices.resources.v2.inference.deployments.deployments.AsyncDeploymentsResourceWithStreamingResponse(
deployments: nemo_microservices.resources.v2.inference.deployments.deployments.AsyncDeploymentsResource,
)#

Initialization

property models: nemo_microservices.resources.v2.inference.deployments.models.AsyncModelsResourceWithStreamingResponse#
property status: nemo_microservices.resources.v2.inference.deployments.status.AsyncStatusResourceWithStreamingResponse#
property versions: nemo_microservices.resources.v2.inference.deployments.versions.AsyncVersionsResourceWithStreamingResponse#
class nemo_microservices.resources.v2.inference.deployments.deployments.DeploymentsResource(
client: nemo_microservices._client.NeMoMicroservices,
)#

Bases: nemo_microservices._resource.SyncAPIResource

Initialization

create(
*,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) object#

Create ModelDeployment endpoint - returns a simple hello world response for now.

delete(
deployment_name: str,
*,
namespace: str,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) None#

Delete All ModelDeployment Versions endpoint - returns a simple hello world response for now.

Args:

extra_headers: Send extra headers

extra_query: Add additional query parameters to the request

extra_body: Add additional JSON properties to the request

timeout: Override the client-level default timeout for this request, in seconds

list(
*,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) object#

List ModelDeployments endpoint - returns a simple hello world response for now. Supports filter parameters for status.

list_namespace(
namespace: str,
*,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) object#

List ModelDeployments By Namespace endpoint - returns a simple hello world response for now.

Args:

extra_headers: Send extra headers

extra_query: Add additional query parameters to the request

extra_body: Add additional JSON properties to the request

timeout: Override the client-level default timeout for this request, in seconds

property models: nemo_microservices.resources.v2.inference.deployments.models.ModelsResource#
retrieve(
deployment_name: str,
*,
namespace: str,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) object#

Get Latest ModelDeployment endpoint - returns a simple hello world response for now.

Args:

extra_headers: Send extra headers

extra_query: Add additional query parameters to the request

extra_body: Add additional JSON properties to the request

timeout: Override the client-level default timeout for this request, in seconds

property status: nemo_microservices.resources.v2.inference.deployments.status.StatusResource#
update(
deployment_name: str,
*,
namespace: str,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) object#

Update ModelDeployment endpoint - returns a simple hello world response for now.

Args:

extra_headers: Send extra headers

extra_query: Add additional query parameters to the request

extra_body: Add additional JSON properties to the request

timeout: Override the client-level default timeout for this request, in seconds

property versions: nemo_microservices.resources.v2.inference.deployments.versions.VersionsResource#
property with_raw_response: nemo_microservices.resources.v2.inference.deployments.deployments.DeploymentsResourceWithRawResponse#

This property can be used as a prefix for any HTTP method call to return the raw response object instead of the parsed content.

For more information, see https://docs.nvidia.com/nemo/microservices/latest/pysdk/index.html#accessing-raw-response-data-e-g-headers

property with_streaming_response: nemo_microservices.resources.v2.inference.deployments.deployments.DeploymentsResourceWithStreamingResponse#

An alternative to .with_raw_response that doesn’t eagerly read the response body.

For more information, see https://docs.nvidia.com/nemo/microservices/latest/pysdk/index.html#with_streaming_response

class nemo_microservices.resources.v2.inference.deployments.deployments.DeploymentsResourceWithRawResponse(
deployments: nemo_microservices.resources.v2.inference.deployments.deployments.DeploymentsResource,
)#

Initialization

property models: nemo_microservices.resources.v2.inference.deployments.models.ModelsResourceWithRawResponse#
property status: nemo_microservices.resources.v2.inference.deployments.status.StatusResourceWithRawResponse#
property versions: nemo_microservices.resources.v2.inference.deployments.versions.VersionsResourceWithRawResponse#
class nemo_microservices.resources.v2.inference.deployments.deployments.DeploymentsResourceWithStreamingResponse(
deployments: nemo_microservices.resources.v2.inference.deployments.deployments.DeploymentsResource,
)#

Initialization

property models: nemo_microservices.resources.v2.inference.deployments.models.ModelsResourceWithStreamingResponse#
property status: nemo_microservices.resources.v2.inference.deployments.status.StatusResourceWithStreamingResponse#
property versions: nemo_microservices.resources.v2.inference.deployments.versions.VersionsResourceWithStreamingResponse#