Skip to content

Commit f0e3718

Browse files
committed
feat(cli): add b200 and h200 GPU options for endpoint creation
1 parent 876f1ca commit f0e3718

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

src/together/cli/api/endpoints.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -98,7 +98,7 @@ def endpoints(ctx: click.Context) -> None:
9898
)
9999
@click.option(
100100
"--gpu",
101-
type=click.Choice(["h100", "a100", "l40", "l40s", "rtx-6000"]),
101+
type=click.Choice(["b200", "h200", "h100", "a100", "l40", "l40s", "rtx-6000"]),
102102
required=True,
103103
help="GPU type to use for inference",
104104
)
@@ -161,6 +161,8 @@ def create(
161161
"""Create a new dedicated inference endpoint."""
162162
# Map GPU types to their full hardware ID names
163163
gpu_map = {
164+
"b200": "nvidia_b200_180gb_sxm",
165+
"h200": "nvidia_h200_140gb_sxm",
164166
"h100": "nvidia_h100_80gb_sxm",
165167
"a100": "nvidia_a100_80gb_pcie" if gpu_count == 1 else "nvidia_a100_80gb_sxm",
166168
"l40": "nvidia_l40",

0 commit comments

Comments
 (0)