We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 32176fe, commit feb92fb (Copy full SHA for feb92fb)
vllm/engine/protocol.py
@@ -140,7 +140,12 @@ async def beam_search(
140
best_beams = sorted_completed[:beam_width]
141
142
for beam in best_beams:
143
- beam.text = tokenizer.decode(beam.tokens[tokenized_length:])
+ if (beam.tokens[-1] == tokenizer.eos_token_id and not ignore_eos):
144
+ # Skip the eos token in the text.
145
+ tokens = beam.tokens[tokenized_length:-1]
146
+ else:
147
+ tokens = beam.tokens[tokenized_length:]
148
+ beam.text = tokenizer.decode(tokens)
149
150
beam_search_output = RequestOutput(
151
request_id=request_id,
0 commit comments