<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
  <url>
    <loc>https://docs.nvidia.com/aiperf/welcome-to-ai-perf-documentation</loc>
    <lastmod>2026-05-30T01:03:58.349Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/getting-started/profiling-with-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.352Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/getting-started/ai-perf-comprehensive-llm-benchmarking</loc>
    <lastmod>2026-05-30T01:03:58.354Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/getting-started/migrating-from-gen-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.356Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/getting-started/gen-ai-perf-vs-ai-perf-cli-feature-comparison-matrix</loc>
    <lastmod>2026-05-30T01:03:58.358Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-open-ai-compatible-text-ap-is-using-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.360Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-the-open-ai-responses-api-with-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.362Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-hugging-face-tgi-models-with-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.364Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-vision-language-models-with-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.365Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-audio-language-models-with-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.367Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-asr-models-with-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.369Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-embedding-models-with-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.371Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-ranking-models-with-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.373Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-nim-image-retrieval-with-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.375Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/sg-lang-image-generation</loc>
    <lastmod>2026-05-30T01:03:58.376Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/sg-lang-image-edit</loc>
    <lastmod>2026-05-30T01:03:58.378Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/sg-lang-video-generation</loc>
    <lastmod>2026-05-30T01:03:58.380Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/synthetic-video-generation</loc>
    <lastmod>2026-05-30T01:03:58.382Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/template-endpoint</loc>
    <lastmod>2026-05-30T01:03:58.384Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/custom-dataset-guide</loc>
    <lastmod>2026-05-30T01:03:58.386Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/inline-datasets</loc>
    <lastmod>2026-05-30T01:03:58.388Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/custom-prompt-benchmarking</loc>
    <lastmod>2026-05-30T01:03:58.390Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-share-gpt-dataset</loc>
    <lastmod>2026-05-30T01:03:58.391Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/synthetic-dataset-generation</loc>
    <lastmod>2026-05-30T01:03:58.393Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-instruct-coder-dataset</loc>
    <lastmod>2026-05-30T01:03:58.395Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-aimo-dataset</loc>
    <lastmod>2026-05-30T01:03:58.397Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-mm-star-dataset</loc>
    <lastmod>2026-05-30T01:03:58.399Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-mmvu-dataset</loc>
    <lastmod>2026-05-30T01:03:58.401Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-l-la-va-one-vision-dataset</loc>
    <lastmod>2026-05-30T01:03:58.403Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-vision-arena-dataset</loc>
    <lastmod>2026-05-30T01:03:58.404Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-blazedit-dataset</loc>
    <lastmod>2026-05-30T01:03:58.406Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-spec-bench-dataset</loc>
    <lastmod>2026-05-30T01:03:58.408Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-speed-bench-dataset</loc>
    <lastmod>2026-05-30T01:03:58.410Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-bailian-traces</loc>
    <lastmod>2026-05-30T01:03:58.412Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-burst-gpt-traces</loc>
    <lastmod>2026-05-30T01:03:58.414Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/replay-sage-maker-data-capture-traces</loc>
    <lastmod>2026-05-30T01:03:58.416Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/raw-payload-replay</loc>
    <lastmod>2026-05-30T01:03:58.417Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/inputs-json-replay</loc>
    <lastmod>2026-05-30T01:03:58.419Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/multi-turn-conversations</loc>
    <lastmod>2026-05-30T01:03:58.421Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/sequence-length-distributions-for-advanced-benchmarking</loc>
    <lastmod>2026-05-30T01:03:58.423Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/prefix-data-synthesis-tutorial</loc>
    <lastmod>2026-05-30T01:03:58.425Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/agentic-code-dataset-generator</loc>
    <lastmod>2026-05-30T01:03:58.426Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/arrival-patterns-simulating-realistic-traffic</loc>
    <lastmod>2026-05-30T01:03:58.428Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/fixed-schedule-benchmarking</loc>
    <lastmod>2026-05-30T01:03:58.430Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/gradual-ramping</loc>
    <lastmod>2026-05-30T01:03:58.432Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/request-rate-with-max-concurrency</loc>
    <lastmod>2026-05-30T01:03:58.434Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/prefill-concurrency-fine-grained-benchmarking-control</loc>
    <lastmod>2026-05-30T01:03:58.436Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/time-based-benchmarking</loc>
    <lastmod>2026-05-30T01:03:58.437Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/multi-url-load-balancing</loc>
    <lastmod>2026-05-30T01:03:58.439Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/request-cancellation-testing</loc>
    <lastmod>2026-05-30T01:03:58.441Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/warmup-phase-configuration</loc>
    <lastmod>2026-05-30T01:03:58.443Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/benchmark-goodput-with-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.445Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/multi-run-confidence-reporting</loc>
    <lastmod>2026-05-30T01:03:58.447Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/parameter-sweeps</loc>
    <lastmod>2026-05-30T01:03:58.448Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/adaptive-search</loc>
    <lastmod>2026-05-30T01:03:58.450Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/time-slicing-for-performance-analysis</loc>
    <lastmod>2026-05-30T01:03:58.452Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/http-trace-metrics-guide</loc>
    <lastmod>2026-05-30T01:03:58.454Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/working-with-profile-export-files</loc>
    <lastmod>2026-05-30T01:03:58.456Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/visualization-and-plotting-with-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.457Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/auto-plot-after-aiperf-profile</loc>
    <lastmod>2026-05-30T01:03:58.459Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/user-centric-timing-for-kv-cache-benchmarking</loc>
    <lastmod>2026-05-30T01:03:58.461Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/gpu-telemetry-with-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.463Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/open-telemetry-m-lflow-integration</loc>
    <lastmod>2026-05-30T01:03:58.465Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/yaml-configuration-files</loc>
    <lastmod>2026-05-30T01:03:58.467Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/sampling-distributions-in-yaml-configs</loc>
    <lastmod>2026-05-30T01:03:58.469Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/user-interface</loc>
    <lastmod>2026-05-30T01:03:58.471Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/using-local-tokenizers-without-hugging-face</loc>
    <lastmod>2026-05-30T01:03:58.472Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/random-number-generation-reproducibility</loc>
    <lastmod>2026-05-30T01:03:58.474Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/sweeping-adaptive-search/search-recipes</loc>
    <lastmod>2026-05-30T01:03:58.476Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/sweeping-adaptive-search/bayesian-optimization</loc>
    <lastmod>2026-05-30T01:03:58.478Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/sweeping-adaptive-search/space-filling-sweeps-sobol-latin-hypercube</loc>
    <lastmod>2026-05-30T01:03:58.480Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/benchmark-modes/load-generator-options-reference</loc>
    <lastmod>2026-05-30T01:03:58.481Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/benchmark-modes/trace-replay-with-mooncake-traces</loc>
    <lastmod>2026-05-30T01:03:58.483Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/benchmark-modes/conversation-dag-benchmarks</loc>
    <lastmod>2026-05-30T01:03:58.485Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/accuracy/accuracy-benchmarking</loc>
    <lastmod>2026-05-30T01:03:58.487Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/command-line-options</loc>
    <lastmod>2026-05-30T01:03:58.489Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/environment-variables</loc>
    <lastmod>2026-05-30T01:03:58.491Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/ai-perf-metrics-reference</loc>
    <lastmod>2026-05-30T01:03:58.492Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/benchmark-datasets</loc>
    <lastmod>2026-05-30T01:03:58.494Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/pre-flight-tokenizer-auto-detection</loc>
    <lastmod>2026-05-30T01:03:58.496Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/conversation-context-mode</loc>
    <lastmod>2026-05-30T01:03:58.498Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/list-metric-aggregation</loc>
    <lastmod>2026-05-30T01:03:58.500Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/vendor-usage-field-reference</loc>
    <lastmod>2026-05-30T01:03:58.501Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/json-export-schema</loc>
    <lastmod>2026-05-30T01:03:58.503Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/http-api-endpoints</loc>
    <lastmod>2026-05-30T01:03:58.506Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/yaml-config-roadmap</loc>
    <lastmod>2026-05-30T01:03:58.508Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/server-metrics/server-metrics-collection</loc>
    <lastmod>2026-05-30T01:03:58.509Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/server-metrics/ai-perf-server-metrics-reference</loc>
    <lastmod>2026-05-30T01:03:58.511Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/server-metrics/ai-perf-server-metrics-json-export-schema</loc>
    <lastmod>2026-05-30T01:03:58.513Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/server-metrics/ai-perf-server-metrics-parquet-export-schema</loc>
    <lastmod>2026-05-30T01:03:58.515Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/plugins/ai-perf-plugin-system</loc>
    <lastmod>2026-05-30T01:03:58.517Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/plugins/creating-your-first-ai-perf-plugin</loc>
    <lastmod>2026-05-30T01:03:58.519Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/api/prefix-synthesis-api-reference</loc>
    <lastmod>2026-05-30T01:03:58.521Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/api/sweep-aggregates-api-reference</loc>
    <lastmod>2026-05-30T01:03:58.523Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/api/search-history-api-reference</loc>
    <lastmod>2026-05-30T01:03:58.524Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/architecture-of-ai-perf</loc>
    <lastmod>2026-05-30T01:03:58.526Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/metrics-flow</loc>
    <lastmod>2026-05-30T01:03:58.528Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/mixins</loc>
    <lastmod>2026-05-30T01:03:58.530Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/ai-perf-code-patterns</loc>
    <lastmod>2026-05-30T01:03:58.531Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/global-property-test-invariants</loc>
    <lastmod>2026-05-30T01:03:58.533Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/sweep-orchestrator-dev-reference</loc>
    <lastmod>2026-05-30T01:03:58.535Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/yaml-config-future-goals</loc>
    <lastmod>2026-05-30T01:03:58.537Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/troubleshooting/sweep-adaptive-search-errors</loc>
    <lastmod>2026-05-30T01:03:58.539Z</lastmod>
  </url>
</urlset>
