We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4053857, commit 5668c79. Copy full SHA for 5668c79
examples/server/bench/bench.py
@@ -268,6 +268,7 @@ def start_server_background(args):
268
server_args.extend(['--defrag-thold', "0.1"])
269
server_args.append('--cont-batching')
270
server_args.append('--metrics')
271
+ server_args.append('--flash-attn')
272
server_args.extend(['--log-format', "text"])
273
args = [str(arg) for arg in [server_path, *server_args]]
274
print(f"bench: starting server with: {' '.join(args)}")
0 commit comments