We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
--skip-tokenizer-init
echo and return_token_ids
1 parent 78c1d5b · commit a964e5e (Copy full SHA for a964e5e)
tests/entrypoints/openai/test_token_in_token_out.py
@@ -54,7 +54,7 @@ async def test_token_in_token_out_and_logprobs(server):
54
prompt=token_ids,
55
max_tokens=20,
56
temperature=0,
57
- echo=False,
+ echo=True,
58
extra_body={
59
"return_token_ids": True,
60
},
vllm/entrypoints/openai/serving_completion.py
@@ -691,5 +691,6 @@ def _build_render_config(
691
truncate_prompt_tokens=request.truncate_prompt_tokens,
692
add_special_tokens=request.add_special_tokens,
693
cache_salt=request.cache_salt,
694
- needs_detokenization=bool(request.echo),
+ needs_detokenization=bool(request.echo
695
+ and not request.return_token_ids),
696
)
0 commit comments