Skip to content

Commit

Permalink
Set detokenize=False for benchmarks
Browse files: browse the repository at this point in the history
  • Loading branch information
maleksan85 committed Jan 17, 2025
1 parent c566cd9 commit 87d256a
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 0 deletions.
1 change: 1 addition & 0 deletions benchmarks/profiling/benchmark_latency.py
Original file line number Diff line number Diff line change
Expand Up @@ -81,6 +81,7 @@ def get_profiling_context(profile_result_dir: Optional[str] = None):
top_p=1.0,
ignore_eos=True,
max_tokens=args.output_len,
detokenize = False,
)
print(sampling_params)
dummy_prompt_token_ids = np.random.randint(10000,
Expand Down
2 changes: 2 additions & 0 deletions benchmarks/profiling/benchmark_throughput.py
Original file line number Diff line number Diff line change
Expand Up @@ -135,6 +135,7 @@ def get_profiling_context(profile_dir: Optional[str] = None):
top_p=1.0,
ignore_eos=True,
max_tokens=output_len,
detokenize = False,
))

if args.profile_torch or args.profile_rpd:
Expand Down Expand Up @@ -171,6 +172,7 @@ async def run_vllm_async(
top_p=1.0,
ignore_eos=True,
max_tokens=output_len,
detokenize = False,
))

generators = []
Expand Down

0 comments on commit 87d256a

Please sign in to comment.