nemo_microservices.resources.v2.inference.providers.status#

Module Contents#

Classes#

API#

class nemo_microservices.resources.v2.inference.providers.status.AsyncStatusResource(
client: nemo_microservices._client.AsyncNeMoMicroservices,
)#

Bases: nemo_microservices._resource.AsyncAPIResource

Initialization

async update(
provider_name: str,
*,
namespace: str,
model_deployment_id: str | nemo_microservices._types.Omit = omit,
served_models: Iterable[nemo_microservices.types.v2.inference.served_model_mapping_param.ServedModelMappingParam] | nemo_microservices._types.Omit = omit,
status: nemo_microservices.types.v2.inference.model_provider_status.ModelProviderStatus | nemo_microservices._types.Omit = omit,
status_message: str | nemo_microservices._types.Omit = omit,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) → nemo_microservices.types.v2.inference.model_provider.ModelProvider#

Update status-related fields of a model provider.

This endpoint supports partial updates for the following fields, which are managed by the Models Controller:

  • model_deployment_id

  • served_models

  • status

  • status_message

If status is provided without status_message, status_message will be set to an empty string.

Args:

model_deployment_id: Reference to the ModelDeployment ID if this provider is associated with a deployment

served_models: List of models served by this provider with routing information for IGW

status: Status enum for ModelProvider objects.

status_message: Status message. If status is provided without status_message, defaults to an empty string.

extra_headers: Send extra headers

extra_query: Add additional query parameters to the request

extra_body: Add additional JSON properties to the request

timeout: Override the client-level default timeout for this request, in seconds

property with_raw_response: nemo_microservices.resources.v2.inference.providers.status.AsyncStatusResourceWithRawResponse#

This property can be used as a prefix for any HTTP method call to return the raw response object instead of the parsed content.

For more information, see https://docs.nvidia.com/nemo/microservices/latest/pysdk/index.html#accessing-raw-response-data-e-g-headers

property with_streaming_response: nemo_microservices.resources.v2.inference.providers.status.AsyncStatusResourceWithStreamingResponse#

An alternative to .with_raw_response that doesn’t eagerly read the response body.

For more information, see https://docs.nvidia.com/nemo/microservices/latest/pysdk/index.html#with_streaming_response

class nemo_microservices.resources.v2.inference.providers.status.AsyncStatusResourceWithRawResponse(
status: nemo_microservices.resources.v2.inference.providers.status.AsyncStatusResource,
)#

Initialization

class nemo_microservices.resources.v2.inference.providers.status.AsyncStatusResourceWithStreamingResponse(
status: nemo_microservices.resources.v2.inference.providers.status.AsyncStatusResource,
)#

Initialization

class nemo_microservices.resources.v2.inference.providers.status.StatusResource(client: nemo_microservices._client.NeMoMicroservices)#

Bases: nemo_microservices._resource.SyncAPIResource

Initialization

update(
provider_name: str,
*,
namespace: str,
model_deployment_id: str | nemo_microservices._types.Omit = omit,
served_models: Iterable[nemo_microservices.types.v2.inference.served_model_mapping_param.ServedModelMappingParam] | nemo_microservices._types.Omit = omit,
status: nemo_microservices.types.v2.inference.model_provider_status.ModelProviderStatus | nemo_microservices._types.Omit = omit,
status_message: str | nemo_microservices._types.Omit = omit,
extra_headers: nemo_microservices._types.Headers | None = None,
extra_query: nemo_microservices._types.Query | None = None,
extra_body: nemo_microservices._types.Body | None = None,
timeout: float | httpx.Timeout | None | nemo_microservices._types.NotGiven = not_given,
) → nemo_microservices.types.v2.inference.model_provider.ModelProvider#

Update status-related fields of a model provider.

This endpoint supports partial updates for the following fields, which are managed by the Models Controller:

  • model_deployment_id

  • served_models

  • status

  • status_message

If status is provided without status_message, status_message will be set to an empty string.

Args:

model_deployment_id: Reference to the ModelDeployment ID if this provider is associated with a deployment

served_models: List of models served by this provider with routing information for IGW

status: Status enum for ModelProvider objects.

status_message: Status message. If status is provided without status_message, defaults to an empty string.

extra_headers: Send extra headers

extra_query: Add additional query parameters to the request

extra_body: Add additional JSON properties to the request

timeout: Override the client-level default timeout for this request, in seconds

property with_raw_response: nemo_microservices.resources.v2.inference.providers.status.StatusResourceWithRawResponse#

This property can be used as a prefix for any HTTP method call to return the raw response object instead of the parsed content.

For more information, see https://docs.nvidia.com/nemo/microservices/latest/pysdk/index.html#accessing-raw-response-data-e-g-headers

property with_streaming_response: nemo_microservices.resources.v2.inference.providers.status.StatusResourceWithStreamingResponse#

An alternative to .with_raw_response that doesn’t eagerly read the response body.

For more information, see https://docs.nvidia.com/nemo/microservices/latest/pysdk/index.html#with_streaming_response

class nemo_microservices.resources.v2.inference.providers.status.StatusResourceWithRawResponse(
status: nemo_microservices.resources.v2.inference.providers.status.StatusResource,
)#

Initialization

class nemo_microservices.resources.v2.inference.providers.status.StatusResourceWithStreamingResponse(
status: nemo_microservices.resources.v2.inference.providers.status.StatusResource,
)#

Initialization