Skip to content

Commit 4053857

Browse files
committed
server: support flash_attn param
1 parent 599ce84 commit 4053857

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

examples/server/server.cpp

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -2722,6 +2722,8 @@ static void server_params_parse(int argc, char ** argv, server_params & sparams,
2722 2722
params.embedding = true;
2723 2723
} else if (arg == "-cb" || arg == "--cont-batching") {
2724 2724
params.cont_batching = true;
2725 +
} else if (arg == "-fa" || arg == "--flash-attn") {
2726 +
params.flash_attn = true;
2725 2727
} else if (arg == "-np" || arg == "--parallel") {
2726 2728
if (++i >= argc) {
2727 2729
invalid_param = true;

0 commit comments

Comments
 (0)