Skip to content
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
@@ -1,3 +1,5 @@
# Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.

import json
import logging
import math
Expand All @@ -24,9 +26,6 @@ def test_inference_pipeline(golden_values_path: str, test_values_path: str) -> N
# Handle JSONL output, assume only one line in this case.
output_current = json.loads(output_current)

assert set(output_groundtruth.keys()).issuperset(
set(output_current.keys())
), f"Some IDs from groundtruth are missing in current: {output_groundtruth.keys()} vs {output_current.keys()}"
if set(output_groundtruth.keys()) != set(output_current.keys()):
logger.warning(
f"Some IDs from groundtruth are missing in output, only the subset of ids in groundtruth will be tested: {output_groundtruth.keys()} vs {output_current.keys()}"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -156,6 +156,5 @@
-1.2342015504837036,
-0.5394397377967834
]
},
"throughput": 6.543502517233578
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -75,7 +75,7 @@ MODEL_ARGS:
--output-path: ${TENSORBOARD_PATH}
--prompts: "Time travel to 2008, and go to a bar or a club or one of the myriad disco-basements on the Lower East Side that does not quite know which of those it is. Dance awkwardly in a room full of other glittered-up nerds, and wait for something to happen, buoyed on the feeling that this is the big swollen heart of life, that this is New York like the movies."
--incoming-requests-per-sec: -1 # all requests arrive up front.
--inference-repeat-n: 8
--inference-repeat-n: 1
METRICS:
- "generated_tokens"
- "logprobs"
Loading