<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
  <url>
    <loc>https://docs.nvidia.com/aiperf/welcome-to-ai-perf-documentation</loc>
    <lastmod>2026-05-16T02:17:38.932Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/getting-started/profiling-with-ai-perf</loc>
    <lastmod>2026-05-16T02:17:38.936Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/getting-started/ai-perf-comprehensive-llm-benchmarking</loc>
    <lastmod>2026-05-16T02:17:38.939Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/getting-started/migrating-from-gen-ai-perf</loc>
    <lastmod>2026-05-16T02:17:38.941Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/getting-started/gen-ai-perf-vs-ai-perf-cli-feature-comparison-matrix</loc>
    <lastmod>2026-05-16T02:17:38.944Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-open-ai-compatible-text-ap-is-using-ai-perf</loc>
    <lastmod>2026-05-16T02:17:38.947Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-the-open-ai-responses-api-with-ai-perf</loc>
    <lastmod>2026-05-16T02:17:38.949Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-hugging-face-tgi-models-with-ai-perf</loc>
    <lastmod>2026-05-16T02:17:38.952Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-vision-language-models-with-ai-perf</loc>
    <lastmod>2026-05-16T02:17:38.954Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-audio-language-models-with-ai-perf</loc>
    <lastmod>2026-05-16T02:17:38.957Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-asr-models-with-ai-perf</loc>
    <lastmod>2026-05-16T02:17:38.959Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-embedding-models-with-ai-perf</loc>
    <lastmod>2026-05-16T02:17:38.962Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-ranking-models-with-ai-perf</loc>
    <lastmod>2026-05-16T02:17:38.964Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-nim-image-retrieval-with-ai-perf</loc>
    <lastmod>2026-05-16T02:17:38.967Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/sg-lang-image-generation</loc>
    <lastmod>2026-05-16T02:17:38.970Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/sg-lang-image-edit</loc>
    <lastmod>2026-05-16T02:17:38.972Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/sg-lang-video-generation</loc>
    <lastmod>2026-05-16T02:17:38.974Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/synthetic-video-generation</loc>
    <lastmod>2026-05-16T02:17:38.977Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/template-endpoint</loc>
    <lastmod>2026-05-16T02:17:38.979Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/custom-dataset-guide</loc>
    <lastmod>2026-05-16T02:17:38.982Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/inline-datasets</loc>
    <lastmod>2026-05-16T02:17:38.985Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/custom-prompt-benchmarking</loc>
    <lastmod>2026-05-16T02:17:38.987Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-share-gpt-dataset</loc>
    <lastmod>2026-05-16T02:17:38.989Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/synthetic-dataset-generation</loc>
    <lastmod>2026-05-16T02:17:38.992Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-instruct-coder-dataset</loc>
    <lastmod>2026-05-16T02:17:38.994Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-aimo-dataset</loc>
    <lastmod>2026-05-16T02:17:38.997Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-mm-star-dataset</loc>
    <lastmod>2026-05-16T02:17:38.999Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-mmvu-dataset</loc>
    <lastmod>2026-05-16T02:17:39.002Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-l-la-va-one-vision-dataset</loc>
    <lastmod>2026-05-16T02:17:39.004Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-vision-arena-dataset</loc>
    <lastmod>2026-05-16T02:17:39.007Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-blazedit-dataset</loc>
    <lastmod>2026-05-16T02:17:39.009Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-spec-bench-dataset</loc>
    <lastmod>2026-05-16T02:17:39.011Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-speed-bench-dataset</loc>
    <lastmod>2026-05-16T02:17:39.014Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-bailian-traces</loc>
    <lastmod>2026-05-16T02:17:39.017Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-burst-gpt-traces</loc>
    <lastmod>2026-05-16T02:17:39.019Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/replay-sage-maker-data-capture-traces</loc>
    <lastmod>2026-05-16T02:17:39.021Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/raw-payload-replay</loc>
    <lastmod>2026-05-16T02:17:39.024Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/inputs-json-replay</loc>
    <lastmod>2026-05-16T02:17:39.026Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/multi-turn-conversations</loc>
    <lastmod>2026-05-16T02:17:39.029Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/sequence-length-distributions-for-advanced-benchmarking</loc>
    <lastmod>2026-05-16T02:17:39.031Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/prefix-data-synthesis-tutorial</loc>
    <lastmod>2026-05-16T02:17:39.033Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/agentic-code-dataset-generator</loc>
    <lastmod>2026-05-16T02:17:39.036Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/arrival-patterns-simulating-realistic-traffic</loc>
    <lastmod>2026-05-16T02:17:39.038Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/fixed-schedule-benchmarking</loc>
    <lastmod>2026-05-16T02:17:39.041Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/gradual-ramping</loc>
    <lastmod>2026-05-16T02:17:39.043Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/request-rate-with-max-concurrency</loc>
    <lastmod>2026-05-16T02:17:39.046Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/prefill-concurrency-fine-grained-benchmarking-control</loc>
    <lastmod>2026-05-16T02:17:39.048Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/time-based-benchmarking</loc>
    <lastmod>2026-05-16T02:17:39.051Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/multi-url-load-balancing</loc>
    <lastmod>2026-05-16T02:17:39.053Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/request-cancellation-testing</loc>
    <lastmod>2026-05-16T02:17:39.056Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/warmup-phase-configuration</loc>
    <lastmod>2026-05-16T02:17:39.058Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/benchmark-goodput-with-ai-perf</loc>
    <lastmod>2026-05-16T02:17:39.060Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/multi-run-confidence-reporting</loc>
    <lastmod>2026-05-16T02:17:39.063Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/parameter-sweeps</loc>
    <lastmod>2026-05-16T02:17:39.065Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/adaptive-search</loc>
    <lastmod>2026-05-16T02:17:39.068Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/time-slicing-for-performance-analysis</loc>
    <lastmod>2026-05-16T02:17:39.070Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/http-trace-metrics-guide</loc>
    <lastmod>2026-05-16T02:17:39.073Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/working-with-profile-export-files</loc>
    <lastmod>2026-05-16T02:17:39.075Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/visualization-and-plotting-with-ai-perf</loc>
    <lastmod>2026-05-16T02:17:39.077Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/auto-plot-after-aiperf-profile</loc>
    <lastmod>2026-05-16T02:17:39.080Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/user-centric-timing-for-kv-cache-benchmarking</loc>
    <lastmod>2026-05-16T02:17:39.082Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/gpu-telemetry-with-ai-perf</loc>
    <lastmod>2026-05-16T02:17:39.085Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/open-telemetry-m-lflow-integration</loc>
    <lastmod>2026-05-16T02:17:39.087Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/yaml-configuration-files</loc>
    <lastmod>2026-05-16T02:17:39.089Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/sampling-distributions-in-yaml-configs</loc>
    <lastmod>2026-05-16T02:17:39.092Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/user-interface</loc>
    <lastmod>2026-05-16T02:17:39.094Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/using-local-tokenizers-without-hugging-face</loc>
    <lastmod>2026-05-16T02:17:39.097Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/random-number-generation-reproducibility</loc>
    <lastmod>2026-05-16T02:17:39.099Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/sweeping-adaptive-search/search-recipes</loc>
    <lastmod>2026-05-16T02:17:39.102Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/sweeping-adaptive-search/bayesian-optimization</loc>
    <lastmod>2026-05-16T02:17:39.104Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/sweeping-adaptive-search/space-filling-sweeps-sobol-latin-hypercube</loc>
    <lastmod>2026-05-16T02:17:39.107Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/benchmark-modes/load-generator-options-reference</loc>
    <lastmod>2026-05-16T02:17:39.109Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/benchmark-modes/trace-replay-with-mooncake-traces</loc>
    <lastmod>2026-05-16T02:17:39.111Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/benchmark-modes/conversation-dag-benchmarks</loc>
    <lastmod>2026-05-16T02:17:39.114Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/accuracy/accuracy-benchmarking</loc>
    <lastmod>2026-05-16T02:17:39.116Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/command-line-options</loc>
    <lastmod>2026-05-16T02:17:39.118Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/environment-variables</loc>
    <lastmod>2026-05-16T02:17:39.121Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/ai-perf-metrics-reference</loc>
    <lastmod>2026-05-16T02:17:39.123Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/benchmark-datasets</loc>
    <lastmod>2026-05-16T02:17:39.125Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/pre-flight-tokenizer-auto-detection</loc>
    <lastmod>2026-05-16T02:17:39.128Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/conversation-context-mode</loc>
    <lastmod>2026-05-16T02:17:39.130Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/list-metric-aggregation</loc>
    <lastmod>2026-05-16T02:17:39.133Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/vendor-usage-field-reference</loc>
    <lastmod>2026-05-16T02:17:39.135Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/json-export-schema</loc>
    <lastmod>2026-05-16T02:17:39.137Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/yaml-config-roadmap</loc>
    <lastmod>2026-05-16T02:17:39.140Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/server-metrics/server-metrics-collection</loc>
    <lastmod>2026-05-16T02:17:39.142Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/server-metrics/ai-perf-server-metrics-reference</loc>
    <lastmod>2026-05-16T02:17:39.145Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/server-metrics/ai-perf-server-metrics-json-export-schema</loc>
    <lastmod>2026-05-16T02:17:39.147Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/server-metrics/ai-perf-server-metrics-parquet-export-schema</loc>
    <lastmod>2026-05-16T02:17:39.149Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/plugins/ai-perf-plugin-system</loc>
    <lastmod>2026-05-16T02:17:39.152Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/plugins/creating-your-first-ai-perf-plugin</loc>
    <lastmod>2026-05-16T02:17:39.154Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/api/prefix-synthesis-api-reference</loc>
    <lastmod>2026-05-16T02:17:39.157Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/api/sweep-aggregates-api-reference</loc>
    <lastmod>2026-05-16T02:17:39.159Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/api/search-history-api-reference</loc>
    <lastmod>2026-05-16T02:17:39.161Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/architecture-of-ai-perf</loc>
    <lastmod>2026-05-16T02:17:39.164Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/metrics-flow</loc>
    <lastmod>2026-05-16T02:17:39.166Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/mixins</loc>
    <lastmod>2026-05-16T02:17:39.168Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/ai-perf-code-patterns</loc>
    <lastmod>2026-05-16T02:17:39.171Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/global-property-test-invariants</loc>
    <lastmod>2026-05-16T02:17:39.173Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/sweep-orchestrator-dev-reference</loc>
    <lastmod>2026-05-16T02:17:39.176Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/yaml-config-future-goals</loc>
    <lastmod>2026-05-16T02:17:39.178Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/troubleshooting/sweep-adaptive-search-errors</loc>
    <lastmod>2026-05-16T02:17:39.181Z</lastmod>
  </url>
</urlset>
