<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
  <url>
    <loc>https://docs.nvidia.com/aiperf/welcome-to-ai-perf-documentation</loc>
    <lastmod>2026-05-15T22:08:08.464Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/getting-started/profiling-with-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.467Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/getting-started/ai-perf-comprehensive-llm-benchmarking</loc>
    <lastmod>2026-05-15T22:08:08.468Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/getting-started/migrating-from-gen-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.470Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/getting-started/gen-ai-perf-vs-ai-perf-cli-feature-comparison-matrix</loc>
    <lastmod>2026-05-15T22:08:08.472Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-open-ai-compatible-text-ap-is-using-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.473Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-the-open-ai-responses-api-with-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.474Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-hugging-face-tgi-models-with-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.476Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-vision-language-models-with-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.477Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-audio-language-models-with-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.478Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-asr-models-with-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.480Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-embedding-models-with-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.481Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-ranking-models-with-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.482Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/profile-nim-image-retrieval-with-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.484Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/sg-lang-image-generation</loc>
    <lastmod>2026-05-15T22:08:08.485Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/sg-lang-image-edit</loc>
    <lastmod>2026-05-15T22:08:08.486Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/sg-lang-video-generation</loc>
    <lastmod>2026-05-15T22:08:08.488Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/synthetic-video-generation</loc>
    <lastmod>2026-05-15T22:08:08.489Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/model-endpoint-guides/template-endpoint</loc>
    <lastmod>2026-05-15T22:08:08.490Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/custom-dataset-guide</loc>
    <lastmod>2026-05-15T22:08:08.492Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/inline-datasets</loc>
    <lastmod>2026-05-15T22:08:08.493Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/custom-prompt-benchmarking</loc>
    <lastmod>2026-05-15T22:08:08.494Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-share-gpt-dataset</loc>
    <lastmod>2026-05-15T22:08:08.495Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/synthetic-dataset-generation</loc>
    <lastmod>2026-05-15T22:08:08.497Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-instruct-coder-dataset</loc>
    <lastmod>2026-05-15T22:08:08.498Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-aimo-dataset</loc>
    <lastmod>2026-05-15T22:08:08.500Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-mm-star-dataset</loc>
    <lastmod>2026-05-15T22:08:08.501Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-mmvu-dataset</loc>
    <lastmod>2026-05-15T22:08:08.502Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-l-la-va-one-vision-dataset</loc>
    <lastmod>2026-05-15T22:08:08.503Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-vision-arena-dataset</loc>
    <lastmod>2026-05-15T22:08:08.505Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-blazedit-dataset</loc>
    <lastmod>2026-05-15T22:08:08.506Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-spec-bench-dataset</loc>
    <lastmod>2026-05-15T22:08:08.507Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-speed-bench-dataset</loc>
    <lastmod>2026-05-15T22:08:08.508Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-bailian-traces</loc>
    <lastmod>2026-05-15T22:08:08.510Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/profile-with-burst-gpt-traces</loc>
    <lastmod>2026-05-15T22:08:08.511Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/replay-sage-maker-data-capture-traces</loc>
    <lastmod>2026-05-15T22:08:08.512Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/raw-payload-replay</loc>
    <lastmod>2026-05-15T22:08:08.514Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/inputs-json-replay</loc>
    <lastmod>2026-05-15T22:08:08.515Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/multi-turn-conversations</loc>
    <lastmod>2026-05-15T22:08:08.517Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/sequence-length-distributions-for-advanced-benchmarking</loc>
    <lastmod>2026-05-15T22:08:08.518Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/prefix-data-synthesis-tutorial</loc>
    <lastmod>2026-05-15T22:08:08.520Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/datasets-inputs/agentic-code-dataset-generator</loc>
    <lastmod>2026-05-15T22:08:08.521Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/arrival-patterns-simulating-realistic-traffic</loc>
    <lastmod>2026-05-15T22:08:08.523Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/fixed-schedule-benchmarking</loc>
    <lastmod>2026-05-15T22:08:08.524Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/gradual-ramping</loc>
    <lastmod>2026-05-15T22:08:08.525Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/request-rate-with-max-concurrency</loc>
    <lastmod>2026-05-15T22:08:08.526Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/prefill-concurrency-fine-grained-benchmarking-control</loc>
    <lastmod>2026-05-15T22:08:08.527Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/time-based-benchmarking</loc>
    <lastmod>2026-05-15T22:08:08.529Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/multi-url-load-balancing</loc>
    <lastmod>2026-05-15T22:08:08.530Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/request-cancellation-testing</loc>
    <lastmod>2026-05-15T22:08:08.531Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/load-patterns-scheduling/warmup-phase-configuration</loc>
    <lastmod>2026-05-15T22:08:08.532Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/benchmark-goodput-with-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.534Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/multi-run-confidence-reporting</loc>
    <lastmod>2026-05-15T22:08:08.535Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/parameter-sweeps</loc>
    <lastmod>2026-05-15T22:08:08.541Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/adaptive-search</loc>
    <lastmod>2026-05-15T22:08:08.542Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/time-slicing-for-performance-analysis</loc>
    <lastmod>2026-05-15T22:08:08.543Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/http-trace-metrics-guide</loc>
    <lastmod>2026-05-15T22:08:08.544Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/working-with-profile-export-files</loc>
    <lastmod>2026-05-15T22:08:08.546Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/visualization-and-plotting-with-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.547Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/auto-plot-after-aiperf-profile</loc>
    <lastmod>2026-05-15T22:08:08.548Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/user-centric-timing-for-kv-cache-benchmarking</loc>
    <lastmod>2026-05-15T22:08:08.549Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/gpu-telemetry-with-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.551Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/metrics-analysis/open-telemetry-m-lflow-integration</loc>
    <lastmod>2026-05-15T22:08:08.552Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/yaml-configuration-files</loc>
    <lastmod>2026-05-15T22:08:08.553Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/sampling-distributions-in-yaml-configs</loc>
    <lastmod>2026-05-15T22:08:08.554Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/user-interface</loc>
    <lastmod>2026-05-15T22:08:08.555Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/using-local-tokenizers-without-hugging-face</loc>
    <lastmod>2026-05-15T22:08:08.557Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/tutorials/configuration/random-number-generation-reproducibility</loc>
    <lastmod>2026-05-15T22:08:08.558Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/sweeping-adaptive-search/search-recipes</loc>
    <lastmod>2026-05-15T22:08:08.559Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/sweeping-adaptive-search/bayesian-optimization</loc>
    <lastmod>2026-05-15T22:08:08.560Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/sweeping-adaptive-search/space-filling-sweeps-sobol-latin-hypercube</loc>
    <lastmod>2026-05-15T22:08:08.561Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/benchmark-modes/load-generator-options-reference</loc>
    <lastmod>2026-05-15T22:08:08.563Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/benchmark-modes/trace-replay-with-mooncake-traces</loc>
    <lastmod>2026-05-15T22:08:08.564Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/benchmark-modes/conversation-dag-benchmarks</loc>
    <lastmod>2026-05-15T22:08:08.565Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/accuracy/accuracy-benchmarking</loc>
    <lastmod>2026-05-15T22:08:08.566Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/command-line-options</loc>
    <lastmod>2026-05-15T22:08:08.567Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/environment-variables</loc>
    <lastmod>2026-05-15T22:08:08.569Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/ai-perf-metrics-reference</loc>
    <lastmod>2026-05-15T22:08:08.570Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/benchmark-datasets</loc>
    <lastmod>2026-05-15T22:08:08.571Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/pre-flight-tokenizer-auto-detection</loc>
    <lastmod>2026-05-15T22:08:08.572Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/conversation-context-mode</loc>
    <lastmod>2026-05-15T22:08:08.574Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/list-metric-aggregation</loc>
    <lastmod>2026-05-15T22:08:08.575Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/vendor-usage-field-reference</loc>
    <lastmod>2026-05-15T22:08:08.576Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/json-export-schema</loc>
    <lastmod>2026-05-15T22:08:08.577Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/reference/yaml-config-roadmap</loc>
    <lastmod>2026-05-15T22:08:08.579Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/server-metrics/server-metrics-collection</loc>
    <lastmod>2026-05-15T22:08:08.580Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/server-metrics/ai-perf-server-metrics-reference</loc>
    <lastmod>2026-05-15T22:08:08.581Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/server-metrics/ai-perf-server-metrics-json-export-schema</loc>
    <lastmod>2026-05-15T22:08:08.583Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/server-metrics/ai-perf-server-metrics-parquet-export-schema</loc>
    <lastmod>2026-05-15T22:08:08.584Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/plugins/ai-perf-plugin-system</loc>
    <lastmod>2026-05-15T22:08:08.585Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/plugins/creating-your-first-ai-perf-plugin</loc>
    <lastmod>2026-05-15T22:08:08.586Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/api/prefix-synthesis-api-reference</loc>
    <lastmod>2026-05-15T22:08:08.588Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/api/sweep-aggregates-api-reference</loc>
    <lastmod>2026-05-15T22:08:08.589Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/api/search-history-api-reference</loc>
    <lastmod>2026-05-15T22:08:08.590Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/architecture-of-ai-perf</loc>
    <lastmod>2026-05-15T22:08:08.592Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/metrics-flow</loc>
    <lastmod>2026-05-15T22:08:08.593Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/mixins</loc>
    <lastmod>2026-05-15T22:08:08.594Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/ai-perf-code-patterns</loc>
    <lastmod>2026-05-15T22:08:08.595Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/global-property-test-invariants</loc>
    <lastmod>2026-05-15T22:08:08.596Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/sweep-orchestrator-dev-reference</loc>
    <lastmod>2026-05-15T22:08:08.598Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/architecture-internals/yaml-config-future-goals</loc>
    <lastmod>2026-05-15T22:08:08.599Z</lastmod>
  </url>
  <url>
    <loc>https://docs.nvidia.com/aiperf/troubleshooting/sweep-adaptive-search-errors</loc>
    <lastmod>2026-05-15T22:08:08.600Z</lastmod>
  </url>
</urlset>
