From a26cb8725fafe35531e224ee45eed812b0474772 Mon Sep 17 00:00:00 2001
From: Samuel Monson
Date: Fri, 14 Mar 2025 17:11:21 -0400
Subject: [PATCH 1/7] Add scenario argument

---
 src/guidellm/main.py             | 15 +++++++++++-
 src/guidellm/utils/cli_params.py | 39 +++++++++++++++++++++++++++++++-
 2 files changed, 52 insertions(+), 2 deletions(-)

diff --git a/src/guidellm/main.py b/src/guidellm/main.py
index e7363c6..169131f 100644
--- a/src/guidellm/main.py
+++ b/src/guidellm/main.py
@@ -1,5 +1,5 @@
 import asyncio
-from typing import Any, Literal, Mapping, Optional, Union, get_args
+from typing import Any, IO, Literal, Mapping, Optional, Union, get_args
 
 import click
 from loguru import logger
@@ -18,6 +18,8 @@
 
 __all__ = ["generate_benchmark_report"]
 
+# FIXME: Remove
+SCENARIOS = Literal["rag", "short"]
 
 @click.command()
 @click.option(
     "--target",
     type=str,
     required=True,
     help=(
         "The target path or url for the backend to evaluate. "
         "Ex: 'http://localhost:8000'"
     ),
 )
+@click.option(
+    "--scenario",
+    type=cli_params.Union(click.File(mode='r'), click.Choice(get_args(SCENARIOS))),
+    default=None,
+    help=(
+        "TODO: A scenario or path to config"
+    ),
+)
 @click.option(
     "--backend",
     type=click.Choice(get_args(BackendType)),
     default="openai_http",
     help=(
         "The backend to use for benchmarking. "
         "The default is OpenAI Server enabling compatability with any server that "
@@ -154,6 +164,7 @@
 )
 def generate_benchmark_report_cli(
     target: str,
+    scenario: Optional[Union[IO[Any], SCENARIOS]],
     backend: BackendType,
     model: Optional[str],
     data: Optional[str],
@@ -171,6 +182,7 @@ def generate_benchmark_report_cli(
     """
     generate_benchmark_report(
         target=target,
+        scenario=scenario,
         backend=backend,
         model=model,
         data=data,
@@ -189,6 +201,7 @@ def generate_benchmark_report(
     target: str,
     data: Optional[str],
     data_type: Literal["emulated", "file", "transformers"],
+    scenario: Optional[Union[IO[Any], SCENARIOS]],
     backend: BackendType = "openai_http",
     backend_kwargs: Optional[Mapping[str, Any]] = None,
     model: Optional[str] = None,
diff --git a/src/guidellm/utils/cli_params.py b/src/guidellm/utils/cli_params.py
index 4e8800d..f4a2c36 100644
--- a/src/guidellm/utils/cli_params.py
+++ b/src/guidellm/utils/cli_params.py
@@ -4,7 +4,7 @@
 
 from typing import Any, Optional
 
-from click import Context, Parameter, ParamType
+from click import BadParameter, Context, Parameter, ParamType
 
 __all__ = ["MAX_REQUESTS"]
 
@@ -32,3 +32,40 @@ def convert(
 
 
 MAX_REQUESTS = MaxRequestsType()
+
+
+class Union(ParamType):
+    """
+    A custom click parameter type that allows for multiple types to be accepted.
+    """
+
+    def __init__(self, *types: ParamType):
+        self.types = types
+        self.name = "".join(t.name for t in types)
+
+    def convert(self, value, param, ctx):
+        fails = []
+        for t in self.types:
+            try:
+                return t.convert(value, param, ctx)
+            except BadParameter as e:
+                fails.append(str(e))
+                continue
+
+        self.fail("; ".join(fails) or f"Invalid value: {value}")
+
+
+    def get_metavar(self, param: Parameter) -> str:
+        def get_choices(t: ParamType) -> str:
+            meta = t.get_metavar(param)
+            return meta if meta is not None else t.name
+
+        # Get the choices for each type in the union.
+        choices_str = "|".join(map(get_choices, self.types))
+
+        # Use curly braces to indicate a required argument.
+        if param.required and param.param_type_name == "argument":
+            return f"{{{choices_str}}}"
+
+        # Use square brackets to indicate an option or optional argument.
+        return f"[{choices_str}]"

From 7a9a691d648cada6a67d8ba7b7ba84875163a355 Mon Sep 17 00:00:00 2001
From: Samuel Monson
Date: Wed, 19 Mar 2025 14:10:08 -0400
Subject: [PATCH 2/7] Add Benchmark scenario and manager classes

---
 src/guidellm/benchmark/__init__.py |  0
 src/guidellm/benchmark/scenario.py | 63 ++++++++++++++++++++++++++++++
 2 files changed, 63 insertions(+)
 create mode 100644 src/guidellm/benchmark/__init__.py
 create mode 100644 src/guidellm/benchmark/scenario.py

diff --git a/src/guidellm/benchmark/__init__.py b/src/guidellm/benchmark/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/src/guidellm/benchmark/scenario.py b/src/guidellm/benchmark/scenario.py
new file mode 100644
index 0000000..39f67af
--- /dev/null
+++ b/src/guidellm/benchmark/scenario.py
@@ -0,0 +1,63 @@
+from pathlib import Path
+from typing import Any, Dict, Literal, Optional, Self, Union
+
+from pydantic import Field
+
+from guidellm.backend import BackendType
+from guidellm.core import Serializable
+from guidellm.executor import ProfileGenerationMode
+
+__all__ = ["Scenario", "ScenarioManager"]
+
+scenarios_path = Path(__file__).parent / "scenarios"
+
+
+class Scenario(Serializable):
+    backend: BackendType = "openai_http"
+    backend_kwargs: Optional[Dict[str, Any]] = None
+    model: Optional[str] = None
+    tokenizer: Optional[str] = None
+    data: Union[str, Dict[str, Any]] = Field(default_factory=dict)
+    data_type: Literal["emulated", "file", "transformers"] = "emulated"
+    rate_type: ProfileGenerationMode = "sweep"
+    rate: Optional[float] = None
+    max_seconds: int = 120
+    max_requests: Optional[Union[int, Literal["dataset"]]] = None
+
+    def _update(self, **fields: Mapping[str, Any]) -> Self:
+        for k, v in fields.items():
+            if not hasattr(self, k):
+                raise ValueError(f"Invalid field {k}")
+            setattr(self, k, v)
+
+        return self
+
+    def update(self, **fields: Mapping[str, Any]) -> Self:
+        return self._update(**{k: v for k, v in fields.items() if v is not None})
+
+
+class ScenarioManager:
+    def __init__(self, scenarios_dir: Optional[str] = None):
+        self.scenarios: Dict[str, Scenario] = {}
+
+        if scenarios_dir is None:
+            global scenarios_path
+        else:
+            scenarios_path = Path(scenarios_dir)
+
+        # Load built-in scenarios
+        for scenario_path in scenarios_path.glob("*.json"):
+            scenario = Scenario.from_json(scenario_path.read_text())
+            self[scenario_path.stem] = scenario
+
+    def __getitem__(self, scenario_name: str) -> Scenario:
+        return self.scenarios[scenario_name]
+
+    def __setitem__(self, scenario_name: str, scenario: Scenario):
+        if scenario_name in self.scenarios:
+            raise ValueError(f"Scenario {scenario_name} already exists")
+
+        self.scenarios[scenario_name] = scenario
+
+    def list(self):
+        return tuple(self.scenarios.keys())

From b420f8b21c44c6b7503505834ef4a2f1095a6510 Mon Sep 17 00:00:00 2001
From: Samuel Monson
Date: Wed, 19 Mar 2025 14:12:05 -0400
Subject: [PATCH 3/7] Replace all args to generate_benchmark_report with a scenario

---
 src/guidellm/main.py | 106 +++++++++++++++++++++++--------------------
 1 file changed, 56 insertions(+), 50 deletions(-)

diff --git a/src/guidellm/main.py b/src/guidellm/main.py
index 169131f..ae1d5e3 100644
--- a/src/guidellm/main.py
+++ b/src/guidellm/main.py
@@ -1,11 +1,12 @@
 import asyncio
-from typing import Any, IO, Literal, Mapping, Optional, Union, get_args
+from typing import IO, Any, Literal, Optional, Union, get_args
 
 import click
 from loguru import logger
 from transformers import AutoTokenizer  # type: ignore[import-untyped]
 
 from guidellm.backend import Backend, BackendType
+from guidellm.benchmark.scenario import Scenario, ScenarioManager
 from guidellm.core import GuidanceReport, TextGenerationBenchmarkReport
 from guidellm.executor import Executor, ProfileGenerationMode
 from guidellm.request import (
@@ -19,7 +20,7 @@
 __all__ = ["generate_benchmark_report"]
 
 # FIXME: Remove
-SCENARIOS = Literal["rag", "short"]
+SCENARIOS = ScenarioManager()
 
 @click.command()
 @click.option(
@@ -33,7 +34,7 @@
 )
 @click.option(
     "--scenario",
-    type=cli_params.Union(click.File(mode='r'), click.Choice(get_args(SCENARIOS))),
+    type=cli_params.Union(click.File(mode="r"), click.Choice(SCENARIOS.list())),
     default=None,
     help=(
         "TODO: A scenario or path to config"
     ),
@@ -42,7 +43,7 @@
 @click.option(
     "--backend",
     type=click.Choice(get_args(BackendType)),
-    default="openai_http",
+    default=None,
     help=(
         "The backend to use for benchmarking. "
         "The default is OpenAI Server enabling compatability with any server that "
@@ -61,7 +62,7 @@
 @click.option(
     "--data",
     type=str,
-    required=True,
+    default=None,
     help=(
         "The data source to use for benchmarking. "
         "Depending on the data-type, it should be a "
@@ -74,7 +75,7 @@
 @click.option(
     "--data-type",
     type=click.Choice(["emulated", "file", "transformers"]),
-    required=True,
+    default=None,
    help=(
         "The type of data to use for benchmarking. "
         "Use 'emulated' for synthetic data, 'file' for a file, or 'transformers' "
@@ -96,7 +97,7 @@
 @click.option(
     "--rate-type",
     type=click.Choice(get_args(ProfileGenerationMode)),
-    default="sweep",
+    default=None,
     help=(
         "The type of request rate to use for benchmarking. "
         "Use sweep to run a full range from synchronous to throughput (default), "
@@ -119,7 +120,7 @@
 @click.option(
     "--max-seconds",
     type=int,
-    default=120,
+    default=None,
     help=(
         "The maximum number of seconds for each benchmark run. "
         "Either max-seconds, max-requests, or both must be set. "
@@ -164,25 +165,35 @@
 )
 def generate_benchmark_report_cli(
     target: str,
-    scenario: Optional[Union[IO[Any], SCENARIOS]],
-    backend: BackendType,
+    scenario: Optional[Union[IO[Any], str]],
+    backend: Optional[BackendType],
     model: Optional[str],
     data: Optional[str],
-    data_type: Literal["emulated", "file", "transformers"],
+    data_type: Optional[Literal["emulated", "file", "transformers"]],
     tokenizer: Optional[str],
-    rate_type: ProfileGenerationMode,
+    rate_type: Optional[ProfileGenerationMode],
     rate: Optional[float],
     max_seconds: Optional[int],
     max_requests: Union[Literal["dataset"], int, None],
-    output_path: str,
+    output_path: Optional[str],
     enable_continuous_refresh: bool,
 ):
     """
     Generate a benchmark report for a specified backend and dataset.
""" - generate_benchmark_report( - target=target, - scenario=scenario, + + if isinstance(scenario, str): + defaults = SCENARIOS[scenario] + elif isinstance(scenario, IO): + defaults = Scenario.from_json(scenario.read()) + SCENARIOS["custom"] = defaults + elif scenario is None: + defaults = Scenario() + else: + raise ValueError("Invalid scenario type") + + # Update defaults with CLI args + defaults.update( backend=backend, model=model, data=data, @@ -191,7 +202,12 @@ def generate_benchmark_report_cli( rate_type=rate_type, rate=rate, max_seconds=max_seconds, - max_requests=max_requests, + max_requests=max_requests + ) + + generate_benchmark_report( + target=target, + scenario=defaults, output_path=output_path, cont_refresh_table=enable_continuous_refresh, ) @@ -199,17 +215,7 @@ def generate_benchmark_report_cli( def generate_benchmark_report( target: str, - data: Optional[str], - data_type: Literal["emulated", "file", "transformers"], - scenario: Optional[Union[IO[Any], SCENARIOS]], - backend: BackendType = "openai_http", - backend_kwargs: Optional[Mapping[str, Any]] = None, - model: Optional[str] = None, - tokenizer: Optional[str] = None, - rate_type: ProfileGenerationMode = "sweep", - rate: Optional[float] = None, - max_seconds: Optional[int] = 120, - max_requests: Union[Literal["dataset"], int, None] = None, + scenario: Scenario, output_path: Optional[str] = None, cont_refresh_table: bool = False, ) -> GuidanceReport: @@ -236,22 +242,22 @@ def generate_benchmark_report( :param backend_kwargs: Additional keyword arguments for the backend. """ logger.info( - "Generating benchmark report with target: {}, backend: {}", target, backend + "Generating benchmark report with target: {}, backend: {}", target, scenario.backend ) # Create backend backend_inst = Backend.create( - type_=backend, + type_=scenario.backend, target=target, - model=model, - **(backend_kwargs or {}), + model=scenario.model, + **(scenario.backend_kwargs or {}), ) backend_inst.validate() request_generator: RequestGenerator # Create tokenizer and request generator - tokenizer_inst = tokenizer + tokenizer_inst = scenario.tokenizer if not tokenizer_inst: try: tokenizer_inst = AutoTokenizer.from_pretrained(backend_inst.model) @@ -261,44 +267,44 @@ def generate_benchmark_report( "--tokenizer must be provided for request generation" ) from err - if data_type == "emulated": + if scenario.data_type == "emulated": request_generator = EmulatedRequestGenerator( - config=data, tokenizer=tokenizer_inst + config=scenario.data, tokenizer=tokenizer_inst ) - elif data_type == "file": - request_generator = FileRequestGenerator(path=data, tokenizer=tokenizer_inst) - elif data_type == "transformers": + elif scenario.data_type == "file": + request_generator = FileRequestGenerator(path=scenario.data, tokenizer=tokenizer_inst) + elif scenario.data_type == "transformers": request_generator = TransformersDatasetRequestGenerator( - dataset=data, tokenizer=tokenizer_inst + dataset=scenario.data, tokenizer=tokenizer_inst ) else: - raise ValueError(f"Unknown data type: {data_type}") + raise ValueError(f"Unknown data type: {scenario.data_type}") - if data_type == "emulated" and max_requests == "dataset": + if scenario.data_type == "emulated" and scenario.max_requests == "dataset": raise ValueError("Cannot use 'dataset' for emulated data") # Create executor executor = Executor( backend=backend_inst, request_generator=request_generator, - mode=rate_type, - rate=rate if rate_type in ("constant", "poisson") else None, + mode=scenario.rate_type, + 
rate=scenario.rate if scenario.rate_type in ("constant", "poisson") else None, max_number=( - len(request_generator) if max_requests == "dataset" else max_requests + len(request_generator) if scenario.max_requests == "dataset" else scenario.max_requests ), - max_duration=max_seconds, + max_duration=scenario.max_seconds, ) # Run executor logger.debug( "Running executor with args: {}", { - "backend": backend, + "backend": scenario.backend, "request_generator": request_generator, - "mode": rate_type, - "rate": rate, - "max_number": max_requests, - "max_duration": max_seconds, + "mode": scenario.rate_type, + "rate": scenario.rate, + "max_number": scenario.max_requests, + "max_duration": scenario.max_seconds, }, ) report = asyncio.run(_run_executor_for_result(executor)) From 26bb3a3ad321a589d52909af0966bf1de893e41b Mon Sep 17 00:00:00 2001 From: Samuel Monson Date: Wed, 19 Mar 2025 14:30:15 -0400 Subject: [PATCH 4/7] kwargs type is the value type not mapping --- src/guidellm/benchmark/scenario.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/guidellm/benchmark/scenario.py b/src/guidellm/benchmark/scenario.py index 39f67af..21db9bc 100644 --- a/src/guidellm/benchmark/scenario.py +++ b/src/guidellm/benchmark/scenario.py @@ -24,7 +24,7 @@ class Scenario(Serializable): max_seconds: int = 120 max_requests: Optional[Union[int, Literal["dataset"]]] = None - def _update(self, **fields: Mapping[str, Any]) -> Self: + def _update(self, **fields: Any) -> Self: for k, v in fields.items(): if not hasattr(self, k): raise ValueError(f"Invalid field {k}") @@ -32,7 +32,7 @@ def _update(self, **fields: Mapping[str, Any]) -> Self: return self - def update(self, **fields: Mapping[str, Any]) -> Self: + def update(self, **fields: Any) -> Self: return self._update(**{k: v for k, v in fields.items() if v is not None}) From 91651b03cfb77c0872198b76e53c274ef332f936 Mon Sep 17 00:00:00 2001 From: Samuel Monson Date: Wed, 19 Mar 2025 14:52:39 -0400 Subject: [PATCH 5/7] Ignore issue with pydantic typing + other fixes --- src/guidellm/benchmark/scenario.py | 5 +++-- src/guidellm/utils/cli_params.py | 2 +- 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/src/guidellm/benchmark/scenario.py b/src/guidellm/benchmark/scenario.py index 21db9bc..d28e8da 100644 --- a/src/guidellm/benchmark/scenario.py +++ b/src/guidellm/benchmark/scenario.py @@ -1,7 +1,8 @@ from pathlib import Path -from typing import Any, Dict, Literal, Optional, Self, Union +from typing import Any, Dict, Literal, Optional, Union from pydantic import Field +from typing_extensions import Self from guidellm.backend import BackendType from guidellm.core import Serializable @@ -17,7 +18,7 @@ class Scenario(Serializable): backend_kwargs: Optional[Dict[str, Any]] = None model: Optional[str] = None tokenizer: Optional[str] = None - data: Union[str, Dict[str, Any]] = Field(default_factory=dict) + data: Union[str, Dict[str, Any]] = Field(default_factory=dict) # type: ignore[arg-type] data_type: Literal["emulated", "file", "transformers"] = "emulated" rate_type: ProfileGenerationMode = "sweep" rate: Optional[float] = None diff --git a/src/guidellm/utils/cli_params.py b/src/guidellm/utils/cli_params.py index f4a2c36..854e6a2 100644 --- a/src/guidellm/utils/cli_params.py +++ b/src/guidellm/utils/cli_params.py @@ -43,7 +43,7 @@ def __init__(self, *types: ParamType): self.types = types self.name = "".join(t.name for t in types) - def convert(self, value, param, ctx): + def convert(self, value, param, ctx) -> Any: fails = [] for t in 
self.types: try: From 047d37b9a24ad123048dbc7e6fc5d638304c6af6 Mon Sep 17 00:00:00 2001 From: Samuel Monson Date: Wed, 19 Mar 2025 15:31:07 -0400 Subject: [PATCH 6/7] Allow sequence of rates --- src/guidellm/benchmark/scenario.py | 4 ++-- src/guidellm/main.py | 9 ++++----- 2 files changed, 6 insertions(+), 7 deletions(-) diff --git a/src/guidellm/benchmark/scenario.py b/src/guidellm/benchmark/scenario.py index d28e8da..570c4c7 100644 --- a/src/guidellm/benchmark/scenario.py +++ b/src/guidellm/benchmark/scenario.py @@ -1,5 +1,5 @@ from pathlib import Path -from typing import Any, Dict, Literal, Optional, Union +from typing import Any, Dict, Literal, Optional, Sequence, Union from pydantic import Field from typing_extensions import Self @@ -21,7 +21,7 @@ class Scenario(Serializable): data: Union[str, Dict[str, Any]] = Field(default_factory=dict) # type: ignore[arg-type] data_type: Literal["emulated", "file", "transformers"] = "emulated" rate_type: ProfileGenerationMode = "sweep" - rate: Optional[float] = None + rate: Optional[Union[float, Sequence[float]]] = None max_seconds: int = 120 max_requests: Optional[Union[int, Literal["dataset"]]] = None diff --git a/src/guidellm/main.py b/src/guidellm/main.py index ae1d5e3..5e539d0 100644 --- a/src/guidellm/main.py +++ b/src/guidellm/main.py @@ -1,5 +1,5 @@ import asyncio -from typing import IO, Any, Literal, Optional, Union, get_args +from typing import Literal, Optional, Sequence, TextIO, Union, get_args import click from loguru import logger @@ -165,14 +165,14 @@ ) def generate_benchmark_report_cli( target: str, - scenario: Optional[Union[IO[Any], str]], + scenario: Optional[Union[TextIO, str]], backend: Optional[BackendType], model: Optional[str], data: Optional[str], data_type: Optional[Literal["emulated", "file", "transformers"]], tokenizer: Optional[str], rate_type: Optional[ProfileGenerationMode], - rate: Optional[float], + rate: Optional[Union[float, Sequence[float]]], max_seconds: Optional[int], max_requests: Union[Literal["dataset"], int, None], output_path: Optional[str], @@ -184,9 +184,8 @@ def generate_benchmark_report_cli( if isinstance(scenario, str): defaults = SCENARIOS[scenario] - elif isinstance(scenario, IO): + elif isinstance(scenario, TextIO): defaults = Scenario.from_json(scenario.read()) - SCENARIOS["custom"] = defaults elif scenario is None: defaults = Scenario() else: From 614b28876f24485498a1895368b494cee5195cf1 Mon Sep 17 00:00:00 2001 From: Samuel Monson Date: Wed, 19 Mar 2025 15:50:50 -0400 Subject: [PATCH 7/7] Use TextIOWrapper to typecheck scenario input TextIOWrapper should be of type TextIO but TextIO does not seem to work for typecheck. Just use the class as type argument of isinstance. --- src/guidellm/main.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/guidellm/main.py b/src/guidellm/main.py index 5e539d0..d27eb1f 100644 --- a/src/guidellm/main.py +++ b/src/guidellm/main.py @@ -1,4 +1,5 @@ import asyncio +from io import TextIOWrapper from typing import Literal, Optional, Sequence, TextIO, Union, get_args import click @@ -184,7 +185,7 @@ def generate_benchmark_report_cli( if isinstance(scenario, str): defaults = SCENARIOS[scenario] - elif isinstance(scenario, TextIO): + elif isinstance(scenario, TextIOWrapper): defaults = Scenario.from_json(scenario.read()) elif scenario is None: defaults = Scenario()
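
Reviewer note: the net effect of this series is that a scenario supplies
defaults and explicitly passed CLI flags override them. Below is a minimal
sketch of that precedence, assuming guidellm with this series applied; the
JSON field values are illustrative stand-ins, not a scenario file shipped
by these patches.

    from io import StringIO

    from guidellm.benchmark.scenario import Scenario

    # A config as it would arrive via `--scenario my-scenario.json`.
    # Field names mirror the Scenario model from PATCH 2/7; the values
    # are made up for illustration.
    config = StringIO('{"rate_type": "constant", "rate": 5.0, "max_seconds": 60}')
    defaults = Scenario.from_json(config.read())

    # update() drops None values, so flags the user never passed
    # (every option default becomes None in PATCH 3/7) leave the
    # scenario's values intact.
    defaults.update(max_seconds=300, model=None)

    assert defaults.max_seconds == 300       # explicit flag wins
    assert defaults.rate_type == "constant"  # scenario value preserved

This is also why PATCH 3/7 moves every click option default to None: a
concrete click default (e.g. the old default="sweep") would always shadow
the scenario's value and make scenarios ineffective.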