NeMo NIM Proxy Target#
The following target references the DeepSeek R2 Distill Llama 8B model from NVIDIA NeMo NIM Proxy in the same Kubernetes namespace.
Refer to garak.generators.nim.NVOpenAIChat for the parameters to specify in the options.nim field.
The options override the default values from the DEFAULT_PARAMS in the API reference.
Important
Export the NIM_API_KEY environment variable with your API key or any value when you start the microservice container.
The environment variable must be set even if it is not used to access build.nvidia.com.
import os
from nemo_microservices import NeMoMicroservices
client = NeMoMicroservices(base_url=os.getenv("AUDITOR_BASE_URL"))
target = client.beta.audit.targets.create(
    namespace="default",
    name="demo-nemo-platform-target",
    type="nim.NVOpenAIChat",
    model="deepseek-ai/deepseek-r1-distill-llama-8b",
    options={
        "nim": {
            "skip_seq_start": "<think>",
            "skip_seq_end": "</think>",
            "max_tokens": 3200,
            "uri": "http://nemo-nim-proxy:8000/v1/"
        }
    }
)
print(target.model_dump_json(indent=2))
curl -X POST "${AUDITOR_BASE_URL}/v1beta1/audit/targets" \
  -H "Accept: application/json" \
  -H "Content-Type: application/json" \
  -d '{
    "namespace": "default",
    "name": "demo-nemo-platform-target",
    "type": "nim.NVOpenAIChat",
    "model": "deepseek-ai/deepseek-r1-distill-llama-8b",
    "options": {
      "nim": {
          "skip_seq_start": "<think>",
          "skip_seq_end": "</think>",
          "max_tokens": 3200,
          "uri": "http://nemo-nim-proxy:8000/v1/"
      }
    }
  }' | jq
Example Output
{
  "model": "deepseek-ai/deepseek-r1-distill-llama-8b",
  "type": "nim.NVOpenAIChat",
  "id": "audit_target-YZooRAoDqCBLGGcApuBasL",
  "created_at": "2025-09-24T14:38:49.990401",
  "custom_fields": {},
  "description": null,
  "entity_id": "audit_target-YZooRAoDqCBLGGcApuBasL",
  "name": "demo-nemo-platform-target",
  "namespace": "default",
  "options": {
    "nim": {
      "skip_seq_start": "<think>",
      "skip_seq_end": "</think>",
      "max_tokens": 3200,
      "uri": "http://nemo-nim-proxy:8000/v1/"
    }
  },
  "ownership": null,
  "project": null,
  "schema_version": "1.0",
  "type_prefix": null,
  "updated_at": "2025-09-24T14:38:49.990404"
}
{
  "schema_version": "1.0",
  "id": "audit_target-TPhoKFape4CdzRTy2HzACK",
  "description": null,
  "type_prefix": null,
  "namespace": "default",
  "project": null,
  "created_at": "2025-08-18T12:37:46.877294",
  "updated_at": "2025-08-18T12:37:46.877298",
  "custom_fields": {},
  "ownership": null,
  "name": "demo-nemo-platform-target",
  "entity_id": "audit_target-TPhoKFape4CdzRTy2HzACK",
  "type": "nim.NVOpenAIChat",
  "model": "deepseek-ai/deepseek-r1-distill-llama-8b",
  "options": {
    "nim": {
      "skip_seq_start": "<think>",
      "skip_seq_end": "</think>",
      "max_tokens": 3200,
      "uri": "http://nemo-nim-proxy:8000/v1/"
    }
  }
}