File tree Expand file tree Collapse file tree 2 files changed +6
-0
lines changed Expand file tree Collapse file tree 2 files changed +6
-0
lines changed Original file line number Diff line number Diff line change @@ -189,5 +189,8 @@ def run_to_completion(profile_dir: Optional[str] = None):
189
189
)
190
190
191
191
parser = EngineArgs .add_cli_args (parser )
192
+ # V1 enables prefix caching by default which skews the latency
193
+ # numbers. We need to disable prefix caching by default.
194
+ parser .set_defaults (enable_prefix_caching = False )
192
195
args = parser .parse_args ()
193
196
main (args )
Original file line number Diff line number Diff line change @@ -80,6 +80,9 @@ def add_cli_args(parser: argparse.ArgumentParser):
80
80
)
81
81
82
82
parser = EngineArgs .add_cli_args (parser )
83
+ # V1 enables prefix caching by default which skews the latency
84
+ # numbers. We need to disable prefix caching by default.
85
+ parser .set_defaults (enable_prefix_caching = False )
83
86
84
87
85
88
def main (args : argparse .Namespace ):
You can’t perform that action at this time.
0 commit comments