Skip to content

Commit 05a9d13

Browse files
author
Your Name
committed
default size
1 parent 647d71f commit 05a9d13

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

vllm/beam/filtering.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -30,7 +30,7 @@ def format_filter(filter_params_list):
3030

3131
MAX_GENERATIONS = 10
3232
_CHUNK_SIZE = 16
33-
33+
_DEFAULT_BEAM_SIZE = 3
3434

3535
class BeamValidator:
3636
def __init__(self, classi_idx, classifier_names):
@@ -42,7 +42,7 @@ async def get_n_valid_beams(self, create_completion: Callable,
4242
raw_request: Optional[Request] = None) -> list[
4343
Union[AsyncGenerator[str, None], CompletionResponse, ErrorResponse]]:
4444
request.stream = False
45-
n = request.n
45+
n = request.n if request.n > 1 else _DEFAULT_BEAM_SIZE
4646
request.n = 1
4747
# TODO(@tanuj): accept max tokens as a parameter
4848
request.max_tokens = _CHUNK_SIZE

0 commit comments

Comments
 (0)