File tree Expand file tree Collapse file tree 2 files changed +6
-0
lines changed Expand file tree Collapse file tree 2 files changed +6
-0
lines changed Original file line number Diff line number Diff line change @@ -189,5 +189,8 @@ def run_to_completion(profile_dir: Optional[str] = None):
189189 )
190190
191191 parser = EngineArgs .add_cli_args (parser )
192+ # V1 enables prefix caching by default which skews the latency
193+ # numbers. We need to disable prefix caching by default.
194+ parser .set_defaults (enable_prefix_caching = False )
192195 args = parser .parse_args ()
193196 main (args )
Original file line number Diff line number Diff line change @@ -80,6 +80,9 @@ def add_cli_args(parser: argparse.ArgumentParser):
8080 )
8181
8282 parser = EngineArgs .add_cli_args (parser )
83+ # V1 enables prefix caching by default which skews the latency
84+ # numbers. We need to disable prefix caching by default.
85+ parser .set_defaults (enable_prefix_caching = False )
8386
8487
8588def main (args : argparse .Namespace ):
You can’t perform that action at this time.
0 commit comments