Skip to content

Commit 820dfe8

Browse files
committed
Update inference.py
1 parent 972e75c commit 820dfe8

File tree

1 file changed

+1
-2
lines changed

1 file changed

+1
-2
lines changed

optillm/inference.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1277,8 +1277,7 @@ def get_optimized_generation_config(self, generation_params: Optional[Dict[str,
1277 1277   "eos_token_id": self.tokenizer.eos_token_id,
1278 1278   "return_dict_in_generate": True,
1279 1279   "output_scores": generation_params.get("logprobs", False),
1280      - "use_cache": True,
1281      - "return_legacy_cache": True, # To avoid warning
     1280 + "use_cache": True
1282 1281   }
1283 1282   return config
1284 1283

0 commit comments

Comments
 (0)